diff --git a/www/services/bibliometrix_etl/README.md b/www/services/bibliometrix_etl/README.md new file mode 100644 index 000000000..4b933a73e --- /dev/null +++ b/www/services/bibliometrix_etl/README.md @@ -0,0 +1,88 @@ +# Bibliometrix Python ETL Project + +## Project Overview + +This project implements a Python ETL pipeline for converting heterogeneous bibliographic data into a Web of Science-like schema that can be used by Bibliometrix-Python. + +The project supports both base-level and advanced-level requirements. + +## Problem + +Bibliographic data from different sources such as Scopus, Dimensions, PubMed, and OpenAlex have different formats and field names. Bibliometrix-Python requires a consistent schema similar to Web of Science field tags. + +This project solves the problem by building a source-agnostic ETL pipeline. + +## ETL Pipeline + +The pipeline follows three main stages: + +1. Extract +2. Transform +3. Load + +### Extract + +The extraction module supports: + +- Local CSV/XLSX/TXT files for the base level +- OpenAlex API retrieval for the advanced level + +### Transform + +The transformation module converts raw source fields into standard Web of Science-like tags such as: + +- TI: Title +- AU: Authors +- PY: Publication Year +- SO: Source Title +- DI: DOI +- AB: Abstract +- TC: Times Cited +- SR: Short Reference + +### Load + +The final standardized data is exported as CSV files in the `outputs` folder. + +## Project Structure + +```text +Bibliometrix_ETL_Project +├── data_raw +├── outputs +├── report +└── src + ├── mappings.py + ├── utils.py + ├── extractors.py + ├── transformer.py + ├── validator.py + └── main.py + + How to Run + +Install required packages: +python -m pip install pandas requests openpyxl + +Run the project: +python .\src\main.py + +Generated Outputs + +After running the project, the following files are generated: + +outputs/raw_openalex_records.csv +outputs/standardized_openalex_api.csv +outputs/standardized_scopus_sample.csv +outputs/validation_report_openalex.txt +outputs/validation_report_scopus.txt + +Validation + +The validation module checks: + +Required columns are present +No null values exist in the final DataFrame +Multi-value columns are stored correctly before CSV export + +The project successfully produces standardized bibliographic data and validation reports. \ No newline at end of file diff --git a/www/services/bibliometrix_etl/data_raw/scopus_sample.csv b/www/services/bibliometrix_etl/data_raw/scopus_sample.csv new file mode 100644 index 000000000..e9e2feea3 --- /dev/null +++ b/www/services/bibliometrix_etl/data_raw/scopus_sample.csv @@ -0,0 +1,4 @@ +Authors,Author full names,Title,Year,Source title,Volume,Issue,Page start,Page end,Cited by,DOI,Abstract,Author Keywords,Index Keywords,Affiliations,References,Document Type,Language of Original Document,EID +Smith J.; Rahman A.,"Smith, John; Rahman, Ahmed",Bibliometric Analysis of Artificial Intelligence Research,2024,Journal of Data Science,12,2,101,115,15,https://doi.org/10.1000/sample1,This study analyzes artificial intelligence research using bibliometric methods.,bibliometrics; artificial intelligence; research trends,data science; scientometrics,Nanjing University of Information Science and Technology; University of Dhaka,Reference A; Reference B; Reference C,Article,English,SCOPUS-ID-001 +Chen L.; Karim M.,"Chen, Li; Karim, Mohammad",OpenAlex Data Standardization for Bibliometrix Python,2023,Scientometrics Review,8,1,55,70,9,doi:10.1000/sample2,This paper discusses data standardization challenges in Python bibliometric tools.,OpenAlex; ETL; bibliometrix; Python,metadata; data pipeline,Nanjing University of Information Science and Technology,Reference X; Reference Y,Conference Paper,English,SCOPUS-ID-002 +Lee K.; Hasan R.,"Lee, Kim; Hasan, Rakib",A Source-Agnostic ETL Pipeline for Bibliographic Data,2022,International Journal of Information Systems,15,4,201,220,22,10.1000/sample3,The study proposes an ETL pipeline for heterogeneous bibliographic data sources.,ETL; bibliographic data; data transformation,information systems; metadata conversion,University of Malaya; Nanjing University of Information Science and Technology,Reference M; Reference N; Reference O,Article,English,SCOPUS-ID-003 diff --git a/www/services/bibliometrix_etl/execution_log.md b/www/services/bibliometrix_etl/execution_log.md new file mode 100644 index 000000000..57a5279f3 --- /dev/null +++ b/www/services/bibliometrix_etl/execution_log.md @@ -0,0 +1,66 @@ +# Execution Log + +## Project Name + +Bibliometrix Python ETL Project + +## Objective + +The objective of this project is to build a Python ETL pipeline that converts heterogeneous bibliographic records into a Web of Science-like schema compatible with Bibliometrix-Python. + +## Environment + +Python packages used: + +- pandas +- requests +- openpyxl + +## Command Used + +```bash +python .\src\main.py + +Base Level Execution + +The base-level pipeline used a local Scopus-like CSV file. + +Input file: + +data_raw/scopus_sample.csv + +Generated files: + +outputs/standardized_scopus_sample.csv +outputs/scopus_first_5_normalized_rows.csv +outputs/validation_report_scopus.txt + +Validation result: + +PASSED: Standardized data is valid. +Advanced Level Execution + +The advanced-level pipeline used the OpenAlex API. + +API query: + +bibliometric analysis + +Generated files: + +outputs/raw_openalex_records.csv +outputs/standardized_openalex_api.csv +outputs/openalex_first_5_normalized_rows.csv +outputs/validation_report_openalex.txt + +Validation result: + +PASSED: Standardized data is valid. +Final Terminal Result + +The terminal showed: + +PROJECT EXECUTION COMPLETED +Conclusion + +The ETL pipeline successfully extracted records from both a local file and the OpenAlex API, transformed them into a Web of Science-like schema, validated the standardized data, and exported CSV outputs. \ No newline at end of file diff --git a/www/services/bibliometrix_etl/outputs/analysis_validation_report.txt b/www/services/bibliometrix_etl/outputs/analysis_validation_report.txt new file mode 100644 index 000000000..eee7383b1 --- /dev/null +++ b/www/services/bibliometrix_etl/outputs/analysis_validation_report.txt @@ -0,0 +1,118 @@ +Bibliometrix ETL Analysis Validation Report +====================================================================== + +====================================================================== +Analysis Validation for: Base Level - Scopus Local File +====================================================================== + +1. Total Records +Total records: 3 + +2. Publications by Year +PY +2022 1 +2023 1 +2024 1 + +3. Top Source Titles +SO +Journal of Data Science 1 +Scientometrics Review 1 +International Journal of Information Systems 1 + +4. Top Authors +Smith J. 1 +Rahman A. 1 +Chen L. 1 +Karim M. 1 +Lee K. 1 +Hasan R. 1 + +5. Top Keywords or Index Terms +ETL 2 +bibliometrics 1 +artificial intelligence 1 +research trends 1 +OpenAlex 1 +bibliometrix 1 +Python 1 +bibliographic data 1 +data transformation 1 + +6. Citation Summary +Total citations: 46 +Average citations: 15.33 +Maximum citations: 22 + +Validation Status: PASSED +The standardized CSV file can be used for bibliometric-style analysis. + +====================================================================== +Analysis Validation for: Advanced Level - OpenAlex API +====================================================================== + +1. Total Records +Total records: 50 + +2. Publications by Year +PY +2005 1 +2007 1 +2009 2 +2010 1 +2014 1 +2015 8 +2016 2 +2017 5 +2018 6 +2019 7 +2020 7 +2021 3 +2022 3 +2023 2 +2024 1 + +3. Top Source Titles +SO +Journal of Business Research 8 +Scientometrics 4 +Sustainability 3 +International Journal of Production Economics 2 +El Profesional de la Informacion 1 +International Journal of Consumer Studies 1 +Encyclopedia 1 +Journal of the Association for Information Science and Technology 1 +Omega 1 +Journal of Scientometric Research 1 + +4. Top Authors +Satish Kumar 7 +José M. Merigó 4 +Naveen Donthu 3 +Nitesh Pandey 3 +Weng Marc Lim 3 +Enrique Herrera‐Viedma 3 +Manuel J. Cobo 2 +Domingo Ribeiro Soriano 2 +Debidutta Pattnaik 2 +Debmalya Mukherjee 1 + +5. Top Keywords or Index Terms +Computer science 43 +Bibliometrics 35 +Political science 30 +Library science 29 +Data science 26 +Sociology 21 +Citation 18 +MEDLINE 17 +Field (mathematics) 15 +Engineering 13 + +6. Citation Summary +Total citations: 71312 +Average citations: 1426.24 +Maximum citations: 19703 + +Validation Status: PASSED +The standardized CSV file can be used for bibliometric-style analysis. \ No newline at end of file diff --git a/www/services/bibliometrix_etl/outputs/openalex_first_5_normalized_rows.csv b/www/services/bibliometrix_etl/outputs/openalex_first_5_normalized_rows.csv new file mode 100644 index 000000000..e523e7a57 --- /dev/null +++ b/www/services/bibliometrix_etl/outputs/openalex_first_5_normalized_rows.csv @@ -0,0 +1,6 @@ +DB,UT,DI,PMID,TI,SO,JI,PY,DT,LA,TC,AU,AF,C1,RP,CR,DE,ID,AB,VL,IS,BP,EP,SR +OPENALEX,W3160856016,10.1016/j.jbusres.2021.04.070,,How to conduct a bibliometric analysis: An overview and guidelines,Journal of Business Research,,2021,article,en,12082,Naveen Donthu; Satish Kumar; Debmalya Mukherjee; Nitesh Pandey; Weng Marc Lim,Naveen Donthu; Satish Kumar; Debmalya Mukherjee; Nitesh Pandey; Weng Marc Lim,Georgia State University; Malaviya National Institute of Technology Jaipur; Swinburne University of Technology Sarawak Campus; University of Akron; Malaviya National Institute of Technology Jaipur; Swinburne University of Technology; Swinburne University of Technology Sarawak Campus,,,Bibliometrics; Field (mathematics); Data science; Resource (disambiguation); Computer science; Management science; Focus (optics); Library science; Engineering; Mathematics,Bibliometrics; Field (mathematics); Data science; Resource (disambiguation); Computer science; Management science; Focus (optics); Library science; Engineering; Mathematics; Computer network; Physics; Optics; Pure mathematics,,,,,,"Naveen Donthu, 2021, Journal of Business Research" +OPENALEX,W1021000864,10.1007/s11192-015-1645-z,,The bibliometric analysis of scholarly production: How great is the impact?,Scientometrics,,2015,article,en,2987,Ole Ellegaard; Johan Albert Wallin,Ole Ellegaard; Johan Albert Wallin,University of Southern Denmark; University of Southern Denmark,,,Bibliometrics; Production (economics); Knowledge production; Regional science; Citation analysis; Computer science; Sociology; Library science; Knowledge management; Economics; Citation,Bibliometrics; Production (economics); Knowledge production; Regional science; Citation analysis; Computer science; Sociology; Library science; Knowledge management; Economics; Citation; Macroeconomics,"Bibliometric methods or ""analysis"" are now firmly established as scientific specialties and are an integral part of research evaluation methodology especially within the scientific and applied fields. The methods are used increasingly when studying various aspects of science and also in the way institutions and universities are ranked worldwide. A sufficient number of studies have been completed, and with the resulting literature, it is now possible to analyse the bibliometric method by using its own methodology. The bibliometric literature in this study, which was extracted from Web of Science, is divided into two parts using a method comparable to the method of Jonkers et al. (Characteristics of bibliometrics articles in library and information sciences (LIS) and other journals, pp. 449-551, 2012: The publications either lie within the Information and Library Science (ILS) category or within the non-ILS category which includes more applied, ""subject"" based studies. The impact in the different groupings is judged by means of citation analysis using normalized data and an almost linear increase can be observed from 1994 onwards in the non-ILS category. The implication for the dissemination and use of the bibliometric methods in the different contexts is discussed. A keyword analysis identifies the most popular subjects covered by bibliometric analysis, and multidisciplinary articles are shown to have the highest impact. A noticeable shift is observed in those countries which contribute to the pool of bibliometric analysis, as well as a self-perpetuating effect in giving and taking references.",,,,,"Ole Ellegaard, 2015, Scientometrics" +OPENALEX,W1965746216,10.1016/j.ijpe.2015.01.003,,Green supply chain management: A review and bibliometric analysis,International Journal of Production Economics,,2015,review,en,2058,Behnam Fahimnia; Joseph Sarkis; Hoda Davarzani,Behnam Fahimnia; Joseph Sarkis; Hoda Davarzani,The University of Sydney; Worcester Polytechnic Institute; The University of Sydney,,,Field (mathematics); Supply chain management; Identification (biology); Bibliometrics; Computer science; Supply chain; Management science; Data science; Systematic review; Data mining; Business; Engineering; Political science; MEDLINE; Marketing,Field (mathematics); Supply chain management; Identification (biology); Bibliometrics; Computer science; Supply chain; Management science; Data science; Systematic review; Data mining; Business; Engineering; Political science; MEDLINE; Marketing; Law; Mathematics; Biology; Pure mathematics; Botany,,,,,,"Behnam Fahimnia, 2015, International Journal of Production Economics" +OPENALEX,W3001491100,10.3145/epi.2020.ene.03,,Software tools for conducting bibliometric analysis in science: An up-to-date review,El Profesional de la Informacion,,2020,article,es,1587,José A. Moral-Muñoz; Enrique Herrera‐Viedma; Antonio Santisteban‐Espejo; Manuel J. Cobo,José A. Moral-Muñoz; Enrique Herrera‐Viedma; Antonio Santisteban‐Espejo; Manuel J. Cobo,Universidad de Cádiz; Universidad de Granada; Hospital Universitario Puerta del Mar; Universidad de Cádiz,,,Bibliometrics; Visualization; Data science; Computer science; Data visualization; Set (abstract data type); Scientometrics; Database; Data mining; World Wide Web,Bibliometrics; Visualization; Data science; Computer science; Data visualization; Set (abstract data type); Scientometrics; Database; Data mining; World Wide Web; Programming language,"Bibliometrics has become an essential tool for assessing and analyzing the output of scientists, cooperation between universities, the effect of state-owned science funding on national research and development performance and educational efficiency, among other applications. Therefore, professionals and scientists need a range of theoretical and practical tools to measure experimental data. This review aims to provide an up-to-date review of the various tools available for conducting bibliometric and scientometric analyses, including the sources of data acquisition, performance analysis and visualization tools. The included tools were divided into three categories: general bibliometric and performance analysis, science mapping analysis, and libraries; a description of all of them is provided. A comparative analysis of the database sources support, pre-processing capabilities, analysis and visualization options were also provided in order to facilitate its understanding. Although there are numerous bibliometric databases to obtain data for bibliometric and scientometric analysis, they have been developed for a different purpose. The number of exportable records is between 500 and 50,000 and the coverage of the different science fields is unequal in each database. Concerning the analyzed tools, Bibliometrix contains the more extensive set of techniques and suitable for practitioners through Biblioshiny. VOSviewer has a fantastic visualization and is capable of loading and exporting information from many sources. SciMAT is the tool with a powerful pre-processing and export capability. In views of the variability of features, the users need to decide the desired analysis output and chose the option that better fits into their aims.",,,,,"José A. Moral-Muñoz, 2020, El Profesional de la Informacion" +OPENALEX,W3044902155,10.1111/ijcs.12605,,Financial literacy: A systematic review and bibliometric analysis,International Journal of Consumer Studies,,2020,review,en,1071,Kirti Goyal; Satish Kumar,Kirti Goyal; Satish Kumar,Malaviya National Institute of Technology Jaipur; Malaviya National Institute of Technology Jaipur,,,Financial literacy; Citation; Content analysis; Citation analysis; Bibliometrics; Literacy; Financial analysis; Accounting; Political science; Sociology; Social science; Business; Library science; Finance; Computer science; Pedagogy,Financial literacy; Citation; Content analysis; Citation analysis; Bibliometrics; Literacy; Financial analysis; Accounting; Political science; Sociology; Social science; Business; Library science; Finance; Computer science; Pedagogy,"Abstract Given the paucity of comprehensive summaries in the extant literature, this systematic review, coupled with bibliometric analysis, endeavours to take a meticulous approach intended at presenting quantitative and qualitative knowledge on the ever‐emerging subject of financial literacy. The study comprises a review of 502 articles ‐ published in peer‐reviewed journals from 2000 to 2019. Citation network, page‐rank analysis, co‐citation analysis, content analysis and publication trends have been employed to identify influential work, delineate the intellectual structure of the field and identify gaps. The most prominent journals, authors, countries, articles and themes have been identified using bibliometric analysis, followed by a comprehensive analysis of the content of 107 papers in the identified clusters. The three major themes enumerated are—levels of financial literacy amongst distinct cohorts, the influence that financial literacy exerts on financial planning and behaviour, and the impact of financial education. Additionally, content analysis of 175 papers has been conducted for the last four years’ articles that were not covered in the co‐citation analysis. Emerging themes identified include financial capability, financial inclusion, gender gap, tax & insurance literacy, and digital financial education. A conceptual framework has been modelled portraying the complete picture, following which potential areas of research have been suggested. This study will help policy‐makers, regulators and academic researchers know the nuts and bolts of financial literacy, and identify the relevant areas that need investigation.",,,,,"Kirti Goyal, 2020, International Journal of Consumer Studies" diff --git a/www/services/bibliometrix_etl/outputs/raw_openalex_records.csv b/www/services/bibliometrix_etl/outputs/raw_openalex_records.csv new file mode 100644 index 000000000..edc590b33 --- /dev/null +++ b/www/services/bibliometrix_etl/outputs/raw_openalex_records.csv @@ -0,0 +1,51 @@ +id,doi,display_name,publication_year,cited_by_count,type,language,abstract,source,journal_abbreviation,authors,author_full_names,affiliations,keywords,concepts +https://openalex.org/W3160856016,https://doi.org/10.1016/j.jbusres.2021.04.070,How to conduct a bibliometric analysis: An overview and guidelines,2021,12082,article,en,,Journal of Business Research,,"['Naveen Donthu', 'Satish Kumar', 'Debmalya Mukherjee', 'Nitesh Pandey', 'Weng Marc Lim']","['Naveen Donthu', 'Satish Kumar', 'Debmalya Mukherjee', 'Nitesh Pandey', 'Weng Marc Lim']","['Georgia State University', 'Malaviya National Institute of Technology Jaipur', 'Swinburne University of Technology Sarawak Campus', 'University of Akron', 'Malaviya National Institute of Technology Jaipur', 'Swinburne University of Technology', 'Swinburne University of Technology Sarawak Campus']","['Bibliometrics', 'Field (mathematics)', 'Data science', 'Resource (disambiguation)', 'Computer science', 'Management science', 'Focus (optics)', 'Library science', 'Engineering', 'Mathematics']","['Bibliometrics', 'Field (mathematics)', 'Data science', 'Resource (disambiguation)', 'Computer science', 'Management science', 'Focus (optics)', 'Library science', 'Engineering', 'Mathematics', 'Computer network', 'Physics', 'Optics', 'Pure mathematics']" +https://openalex.org/W1021000864,https://doi.org/10.1007/s11192-015-1645-z,The bibliometric analysis of scholarly production: How great is the impact?,2015,2987,article,en,"Bibliometric methods or ""analysis"" are now firmly established as scientific specialties and are an integral part of research evaluation methodology especially within the scientific and applied fields. The methods are used increasingly when studying various aspects of science and also in the way institutions and universities are ranked worldwide. A sufficient number of studies have been completed, and with the resulting literature, it is now possible to analyse the bibliometric method by using its own methodology. The bibliometric literature in this study, which was extracted from Web of Science, is divided into two parts using a method comparable to the method of Jonkers et al. (Characteristics of bibliometrics articles in library and information sciences (LIS) and other journals, pp. 449-551, 2012: The publications either lie within the Information and Library Science (ILS) category or within the non-ILS category which includes more applied, ""subject"" based studies. The impact in the different groupings is judged by means of citation analysis using normalized data and an almost linear increase can be observed from 1994 onwards in the non-ILS category. The implication for the dissemination and use of the bibliometric methods in the different contexts is discussed. A keyword analysis identifies the most popular subjects covered by bibliometric analysis, and multidisciplinary articles are shown to have the highest impact. A noticeable shift is observed in those countries which contribute to the pool of bibliometric analysis, as well as a self-perpetuating effect in giving and taking references.",Scientometrics,,"['Ole Ellegaard', 'Johan Albert Wallin']","['Ole Ellegaard', 'Johan Albert Wallin']","['University of Southern Denmark', 'University of Southern Denmark']","['Bibliometrics', 'Production (economics)', 'Knowledge production', 'Regional science', 'Citation analysis', 'Computer science', 'Sociology', 'Library science', 'Knowledge management', 'Economics', 'Citation']","['Bibliometrics', 'Production (economics)', 'Knowledge production', 'Regional science', 'Citation analysis', 'Computer science', 'Sociology', 'Library science', 'Knowledge management', 'Economics', 'Citation', 'Macroeconomics']" +https://openalex.org/W1965746216,https://doi.org/10.1016/j.ijpe.2015.01.003,Green supply chain management: A review and bibliometric analysis,2015,2058,review,en,,International Journal of Production Economics,,"['Behnam Fahimnia', 'Joseph Sarkis', 'Hoda Davarzani']","['Behnam Fahimnia', 'Joseph Sarkis', 'Hoda Davarzani']","['The University of Sydney', 'Worcester Polytechnic Institute', 'The University of Sydney']","['Field (mathematics)', 'Supply chain management', 'Identification (biology)', 'Bibliometrics', 'Computer science', 'Supply chain', 'Management science', 'Data science', 'Systematic review', 'Data mining', 'Business', 'Engineering', 'Political science', 'MEDLINE', 'Marketing']","['Field (mathematics)', 'Supply chain management', 'Identification (biology)', 'Bibliometrics', 'Computer science', 'Supply chain', 'Management science', 'Data science', 'Systematic review', 'Data mining', 'Business', 'Engineering', 'Political science', 'MEDLINE', 'Marketing', 'Law', 'Mathematics', 'Biology', 'Pure mathematics', 'Botany']" +https://openalex.org/W3001491100,https://doi.org/10.3145/epi.2020.ene.03,Software tools for conducting bibliometric analysis in science: An up-to-date review,2020,1587,article,es,"Bibliometrics has become an essential tool for assessing and analyzing the output of scientists, cooperation between universities, the effect of state-owned science funding on national research and development performance and educational efficiency, among other applications. Therefore, professionals and scientists need a range of theoretical and practical tools to measure experimental data. This review aims to provide an up-to-date review of the various tools available for conducting bibliometric and scientometric analyses, including the sources of data acquisition, performance analysis and visualization tools. The included tools were divided into three categories: general bibliometric and performance analysis, science mapping analysis, and libraries; a description of all of them is provided. A comparative analysis of the database sources support, pre-processing capabilities, analysis and visualization options were also provided in order to facilitate its understanding. Although there are numerous bibliometric databases to obtain data for bibliometric and scientometric analysis, they have been developed for a different purpose. The number of exportable records is between 500 and 50,000 and the coverage of the different science fields is unequal in each database. Concerning the analyzed tools, Bibliometrix contains the more extensive set of techniques and suitable for practitioners through Biblioshiny. VOSviewer has a fantastic visualization and is capable of loading and exporting information from many sources. SciMAT is the tool with a powerful pre-processing and export capability. In views of the variability of features, the users need to decide the desired analysis output and chose the option that better fits into their aims.",El Profesional de la Informacion,,"['José A. Moral-Muñoz', 'Enrique Herrera‐Viedma', 'Antonio Santisteban‐Espejo', 'Manuel J. Cobo']","['José A. Moral-Muñoz', 'Enrique Herrera‐Viedma', 'Antonio Santisteban‐Espejo', 'Manuel J. Cobo']","['Universidad de Cádiz', 'Universidad de Granada', 'Hospital Universitario Puerta del Mar', 'Universidad de Cádiz']","['Bibliometrics', 'Visualization', 'Data science', 'Computer science', 'Data visualization', 'Set (abstract data type)', 'Scientometrics', 'Database', 'Data mining', 'World Wide Web']","['Bibliometrics', 'Visualization', 'Data science', 'Computer science', 'Data visualization', 'Set (abstract data type)', 'Scientometrics', 'Database', 'Data mining', 'World Wide Web', 'Programming language']" +https://openalex.org/W3044902155,https://doi.org/10.1111/ijcs.12605,Financial literacy: A systematic review and bibliometric analysis,2020,1071,review,en,"Abstract Given the paucity of comprehensive summaries in the extant literature, this systematic review, coupled with bibliometric analysis, endeavours to take a meticulous approach intended at presenting quantitative and qualitative knowledge on the ever‐emerging subject of financial literacy. The study comprises a review of 502 articles ‐ published in peer‐reviewed journals from 2000 to 2019. Citation network, page‐rank analysis, co‐citation analysis, content analysis and publication trends have been employed to identify influential work, delineate the intellectual structure of the field and identify gaps. The most prominent journals, authors, countries, articles and themes have been identified using bibliometric analysis, followed by a comprehensive analysis of the content of 107 papers in the identified clusters. The three major themes enumerated are—levels of financial literacy amongst distinct cohorts, the influence that financial literacy exerts on financial planning and behaviour, and the impact of financial education. Additionally, content analysis of 175 papers has been conducted for the last four years’ articles that were not covered in the co‐citation analysis. Emerging themes identified include financial capability, financial inclusion, gender gap, tax & insurance literacy, and digital financial education. A conceptual framework has been modelled portraying the complete picture, following which potential areas of research have been suggested. This study will help policy‐makers, regulators and academic researchers know the nuts and bolts of financial literacy, and identify the relevant areas that need investigation.",International Journal of Consumer Studies,,"['Kirti Goyal', 'Satish Kumar']","['Kirti Goyal', 'Satish Kumar']","['Malaviya National Institute of Technology Jaipur', 'Malaviya National Institute of Technology Jaipur']","['Financial literacy', 'Citation', 'Content analysis', 'Citation analysis', 'Bibliometrics', 'Literacy', 'Financial analysis', 'Accounting', 'Political science', 'Sociology', 'Social science', 'Business', 'Library science', 'Finance', 'Computer science', 'Pedagogy']","['Financial literacy', 'Citation', 'Content analysis', 'Citation analysis', 'Bibliometrics', 'Literacy', 'Financial analysis', 'Accounting', 'Political science', 'Sociology', 'Social science', 'Business', 'Library science', 'Finance', 'Computer science', 'Pedagogy']" +https://openalex.org/W4399882939,https://doi.org/10.3390/encyclopedia4020065,Bibliometric Analysis: The Main Steps,2024,608,article,en,"Bibliometric analysis is a systematic study carried out on scientific literature for the identification of patterns, trends, and impact within a certain field. Major steps include data collection from relevant databases, data cleaning and refining, and subjecting data to various bibliometric methods—an ensuing step in the generation of meaningful information. Bibliometric analysis is an increasingly popular and thorough technique for examining and assessing massive amounts of scientific data, which is being used more and more in research. This entry thoroughly introduces bibliometric methodology, emphasizing its numerous methodologies. It also provides a set of reliable, step-by-step instructions for confidently performing bibliometric analysis. Furthermore, we investigate the suitable use of bibliometric analysis as an alternative to systematic literature reviews. This entry aims to be a useful tool for learning about the methods and approaches that may be used to perform research studies that use bibliometric analysis, particularly in the fields of academic study.",Encyclopedia,,['Ioannis Passas'],['Ioannis Passas'],['Hellenic Mediterranean University'],"['Data science', 'Bibliometrics', 'Computer science', 'Field (mathematics)', 'Identification (biology)', 'Citation analysis', 'Scientific literature', 'Management science', 'Information retrieval', 'Data mining', 'Citation', 'Library science', 'Engineering', 'Mathematics']","['Data science', 'Bibliometrics', 'Computer science', 'Field (mathematics)', 'Identification (biology)', 'Citation analysis', 'Scientific literature', 'Management science', 'Information retrieval', 'Data mining', 'Citation', 'Library science', 'Engineering', 'Mathematics', 'Biology', 'Botany', 'Paleontology', 'Pure mathematics']" +https://openalex.org/W1907286193,https://doi.org/10.1002/asi.23329,Growth rates of modern science: A bibliometric analysis based on the number of publications and cited references,2015,1512,article,en,"Many studies (in information science) have looked at the growth of science. In this study, we reexamine the question of the growth of science. To do this we (a) use current data up to publication year 2012 and (b) analyze the data across all disciplines and also separately for the natural sciences and for the medical and health sciences. Furthermore, the data were analyzed with an advanced statistical technique—segmented regression analysis—which can identify specific segments with similar growth rates in the history of science. The study is based on two different sets of bibliometric data: (a) the number of publications held as source items in the Web of Science ( WoS , T homson R euters) per publication year and (b) the number of cited references in the publications of the source items per cited reference year. We looked at the rate at which science has grown since the mid‐1600s. In our analysis of cited references we identified three essential growth phases in the development of science, which each led to growth rates tripling in comparison with the previous phase: from less than 1% up to the middle of the 18th century, to 2 to 3% up to the period between the two world wars, and 8 to 9% to 2010.",Journal of the Association for Information Science and Technology,,"['Lutz Bornmann', 'Rüdiger Mutz']","['Lutz Bornmann', 'Rüdiger Mutz']","['Max Planck Society', 'Max Planck Innovation', 'ETH Zurich']","['Bibliometrics', 'Web of science', 'Natural science', 'Computer science', 'Data science', 'Library science', 'Statistics', 'MEDLINE', 'Mathematics', 'Political science', 'Epistemology', 'Philosophy']","['Bibliometrics', 'Web of science', 'Natural science', 'Computer science', 'Data science', 'Library science', 'Statistics', 'MEDLINE', 'Mathematics', 'Political science', 'Epistemology', 'Philosophy', 'Law']" +https://openalex.org/W2563961554,https://doi.org/10.1016/j.omega.2016.12.004,A bibliometric analysis of operations research and management science,2016,721,article,en,,Omega,,"['José M. Merigó', 'Jianbo Yang']","['José M. Merigó', 'Jianbo Yang']","['University of Manchester', 'University of Chile', 'University of Manchester']","['Web of science', 'Bibliometrics', 'Field (mathematics)', 'Data science', 'Computer science', 'Library science', 'Management science', 'Political science', 'Engineering', 'MEDLINE', 'Mathematics']","['Web of science', 'Bibliometrics', 'Field (mathematics)', 'Data science', 'Computer science', 'Library science', 'Management science', 'Political science', 'Engineering', 'MEDLINE', 'Mathematics', 'Pure mathematics', 'Law']" +https://openalex.org/W2998021954,https://doi.org/10.5530/jscires.8.3.32,Bibliometric Analysis using Bibliometrix an R Package,2020,629,article,en,"This study aims to explore the usage of Open-source software in bibliometric analysis. Biblio-metrix an R package for bibliometric and co-citation analysis was used to achieve the research activities. R is an ecosystem software meaning all functions are shared in an open-source environment with the users. We have used Graphene as a subject of research for bibliometric analysis. Graphene is one of the fastest growing research fields in nanotechnology worldwide. A textual query on Web of Science (WoS) Clarivate Analytics using the term “graphene” was performed retrieving 1155 scholarly papers from 2000 to 2017 with having at least one author based in Turkey. Bibliometric results indicate graphene within nanotechnology as a scientific research field is growing steadily. Graphene not only is used in engineering but also can be used in medical technology. Furthermore, this is an ongoing research exploring an Open-source software and its roles in the field of information studies.",Journal of Scientometric Research,,['Hamid Derviş'],['Hamid Derviş'],[],"['Citation analysis', 'Bibliometrics', 'Computer science', 'Citation', 'Data science', 'Field (mathematics)', 'Subject (documents)', 'Analytics', 'Open source', 'Software', 'Web of science', 'World Wide Web', 'Political science', 'MEDLINE', 'Mathematics']","['Citation analysis', 'Bibliometrics', 'Computer science', 'Citation', 'Data science', 'Field (mathematics)', 'Subject (documents)', 'Analytics', 'Open source', 'Software', 'Web of science', 'World Wide Web', 'Political science', 'MEDLINE', 'Mathematics', 'Programming language', 'Law', 'Pure mathematics']" +https://openalex.org/W1748004804,https://doi.org/10.1016/j.jbusres.2015.10.033,A bibliometric analysis of social entrepreneurship,2015,650,article,en,,Journal of Business Research,,"['Andrea Rey‐Martí', 'Domingo Ribeiro Soriano', 'Daniel Palacios‐Marqués']","['Andrea Rey‐Martí', 'Domingo Ribeiro Soriano', 'Daniel Palacios‐Marqués']","['Universitat de València', 'Universitat de València', 'Universitat Politècnica de València']","['Publication', 'Entrepreneurship', 'Boom', 'Social entrepreneurship', 'Sociology', 'Phenomenon', 'Public relations', 'Social science', 'Political science', 'Business', 'Advertising', 'Engineering']","['Publication', 'Entrepreneurship', 'Boom', 'Social entrepreneurship', 'Sociology', 'Phenomenon', 'Public relations', 'Social science', 'Political science', 'Business', 'Advertising', 'Engineering', 'Law', 'Environmental engineering', 'Quantum mechanics', 'Physics']" +https://openalex.org/W2990450011,https://doi.org/10.1016/j.jbusres.2019.10.039,Forty-five years of Journal of Business Research: A bibliometric analysis,2019,923,article,en,,Journal of Business Research,,"['Naveen Donthu', 'Satish Kumar', 'Debidutta Pattnaik']","['Naveen Donthu', 'Satish Kumar', 'Debidutta Pattnaik']","['Georgia State University', 'Malaviya National Institute of Technology Jaipur', 'Malaviya National Institute of Technology Jaipur']","['Publishing', 'Bibliometrics', 'Empirical research', 'Computer science', 'Library science', 'Political science']","['Publishing', 'Bibliometrics', 'Empirical research', 'Computer science', 'Library science', 'Political science', 'Philosophy', 'Law', 'Epistemology']" +https://openalex.org/W4280610169,https://doi.org/10.1016/j.compag.2022.107017,Drones in agriculture: A review and bibliometric analysis,2022,652,review,en,"Drones, also called Unmanned Aerial Vehicles (UAV), have witnessed a remarkable development in recent decades. In agriculture, they have changed farming practices by offering farmers substantial cost savings, increased operational efficiency, and better profitability. Over the past decades, the topic of agricultural drones has attracted remarkable academic attention. We therefore conduct a comprehensive review based on bibliometrics to summarize and structure existing academic literature and reveal current research trends and hotspots. We apply bibliometric techniques and analyze the literature surrounding agricultural drones to summarize and assess previous research. Our analysis indicates that remote sensing, precision agriculture, deep learning, machine learning, and the Internet of Things are critical topics related to agricultural drones. The co-citation analysis reveals six broad research clusters in the literature. This study is one of the first attempts to summarize drone research in agriculture and suggest future research directions.",Computers and Electronics in Agriculture,,"['Abderahman Rejeb', 'Alireza Abdollahi', 'Karim Rejeb', 'Horst Treiblmaier']","['Abderahman Rejeb', 'Alireza Abdollahi', 'Karim Rejeb', 'Horst Treiblmaier']","['University of Rome Tor Vergata', 'Kharazmi University', 'University of Carthage', 'MODUL University Vienna']","['Drone', 'Bibliometrics', 'Agriculture', 'Citation', 'Data science', 'Precision agriculture', 'Profitability index', 'Computer science', 'Geography', 'Business', 'Library science']","['Drone', 'Bibliometrics', 'Agriculture', 'Citation', 'Data science', 'Precision agriculture', 'Profitability index', 'Computer science', 'Geography', 'Business', 'Library science', 'Archaeology', 'Genetics', 'Finance', 'Biology']" +https://openalex.org/W2747467399,https://doi.org/10.1016/j.ssci.2017.08.011,Bibliometric analysis of safety culture research,2017,593,article,en,"The concept of safety culture is characterised by complexity. On the one hand, the concept is challenging content-wise, and on the other hand, is it a multi-dimensional and cross-disciplinary research domain. In this paper, bibliometric analysis has been applied to the field of safety culture to identify fundamental influences and to obtain a structured overview of the characteristics and the developments in this research domain. In total, 1789 publications published between 1900 and 2015 related to safety culture were identified in Web of Science. The 1789 publications cover 4591 authors, 775 journals, 76 countries or territories, and 1866 institutions. Two main research areas can be distinguished in the domain of safety culture: (1) organisational safety culture and (2) health-care and patient safety culture. The latter research area stands in a dominant position in safety culture research nowadays. Key publications are from Guldenmund (2000) and Sexton et al. (2006). Furthermore, ‘Safety Science’ is the key journal publishing on safety culture research, and the USA, England and China are the countries that dominate the publication production. It can be concluded that there is much collaborative research in the safety culture domain as multi-authored publications make up about three quarters of all publications. Also, safety culture research is characterised by a wide variety of research themes and multidisciplinarity. Geographical inequality in the publication output is identified as a point of concern. A movement away from technical aspects towards more human aspects could be detected as a noteworthy change in research focus.",Safety Science,,"['Karolien van Nunen', 'Jie Li', 'Genserik Reniers', 'Koen Ponnet']","['Karolien van Nunen', 'Jie Li', 'Genserik Reniers', 'Koen Ponnet']","['University of Antwerp', 'Capital University of Economics and Business', 'Delft University of Technology', 'Shanghai Maritime University', 'Delft University of Technology', 'University of Antwerp', 'Ghent University', 'University of Antwerp', 'Antwerp Maritime Academy']","['Safety culture', 'Publishing', 'Multidisciplinary approach', 'China', 'Domain (mathematical analysis)', 'Occupational safety and health', 'Discipline', 'Sociology', 'Engineering ethics', 'Public relations', 'Social science', 'Political science', 'Management', 'Engineering', 'Law']","['Safety culture', 'Publishing', 'Multidisciplinary approach', 'China', 'Domain (mathematical analysis)', 'Occupational safety and health', 'Discipline', 'Sociology', 'Engineering ethics', 'Public relations', 'Social science', 'Political science', 'Management', 'Engineering', 'Law', 'Mathematics', 'Mathematical analysis', 'Economics']" +https://openalex.org/W2263682169,https://doi.org/10.1016/j.knosys.2014.12.035,25years at Knowledge-Based Systems: A bibliometric analysis,2015,572,article,en,,Knowledge-Based Systems,,"['Manuel J. Cobo', 'M. Ángeles Martínez', 'María Gutiérrez-Salcedo', 'Hamido Fujita', 'Enrique Herrera‐Viedma']","['Manuel J. Cobo', 'M. Ángeles Martínez', 'María Gutiérrez-Salcedo', 'Hamido Fujita', 'Enrique Herrera‐Viedma']","['Universidad de Cádiz', 'Universidad Internacional De La Rioja', 'Universidad de Jaén', 'Iwate Prefectural University', 'Universidad de Granada']","['Computer science', 'Bibliometrics', 'Impact factor', 'Data science', 'Information retrieval', 'Library science', 'Political science']","['Computer science', 'Bibliometrics', 'Impact factor', 'Data science', 'Information retrieval', 'Library science', 'Political science', 'Law']" +https://openalex.org/W2600942248,https://doi.org/10.1080/10630732.2017.1285123,The First Two Decades of Smart-City Research: A Bibliometric Analysis,2017,667,article,en,"This paper reports on the first two decades of research on smart cities by conducting a bibliometric analysis of the literature published between 1992 and 2012. The analysis shows that smart-city research is fragmented and lacks cohesion, and its growth follows two main development paths. The first one is based on the peer-reviewed publications produced by European universities, which support a holistic perspective on smart cities. The second path, instead, stands on the gray literature produced by the American business community and relates to a techno-centric understanding of the subject. Divided along such paths, the future development of this new and promising field of research risks being undermined. For while the bibliometric analysis indicates that smart cities are emerging as a fast-growing topic of scientific enquiry, much of the knowledge that is generated about them is singularly technological in nature. In that sense, lacking the social intelligence, cultural artifacts, and environmental attributes, which are needed for the ICT-related urban innovation that such research champions.",Journal of Urban Technology,,"['Luca Mora', 'Roberto Bolici', 'Mark Deakin']","['Luca Mora', 'Roberto Bolici', 'Mark Deakin']","['Politecnico di Milano', 'Politecnico di Milano', 'Edinburgh Napier University']","['Bibliometrics', 'Smart growth', 'Field (mathematics)', 'Smart city', 'Data science', 'Regional science', 'Cohesion (chemistry)', 'Grey literature', 'Knowledge management', 'Political science', 'Sociology', 'Computer science', 'Urban planning', 'Engineering', 'Library science', 'Civil engineering', 'World Wide Web']","['Bibliometrics', 'Smart growth', 'Field (mathematics)', 'Smart city', 'Data science', 'Regional science', 'Cohesion (chemistry)', 'Grey literature', 'Knowledge management', 'Political science', 'Sociology', 'Computer science', 'Urban planning', 'Engineering', 'Library science', 'Civil engineering', 'World Wide Web', 'Mathematics', 'MEDLINE', 'Internet of Things', 'Organic chemistry', 'Chemistry', 'Pure mathematics', 'Law']" +https://openalex.org/W3038273726,https://doi.org/10.1016/j.jbusres.2020.06.057,Investigating the emerging COVID-19 research trends in the field of business and management: A bibliometric analysis approach,2020,1066,article,en,,Journal of Business Research,,"['Surabhi Verma', 'Anders Gustafsson']","['Surabhi Verma', 'Anders Gustafsson']","['University of Southern Denmark', 'BI Norwegian Business School']","['Coronavirus disease 2019 (COVID-19)', 'Bibliometrics', '2019-20 coronavirus outbreak', 'Field (mathematics)', 'Severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2)', 'Data science', 'Regional science', 'Computer science', 'Geography', 'Library science', 'Medicine', 'Virology', 'Mathematics']","['Coronavirus disease 2019 (COVID-19)', 'Bibliometrics', '2019-20 coronavirus outbreak', 'Field (mathematics)', 'Severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2)', 'Data science', 'Regional science', 'Computer science', 'Geography', 'Library science', 'Medicine', 'Virology', 'Mathematics', 'Disease', 'Outbreak', 'Infectious disease (medical specialty)', 'Pathology', 'Pure mathematics']" +https://openalex.org/W2904029666,https://doi.org/10.1016/j.engappai.2018.11.007,Industry 4.0: A bibliometric analysis and detailed overview,2018,544,article,en,,Engineering Applications of Artificial Intelligence,,"['Pranab K. Muhuri', 'Amit K. Shukla', 'Ajith Abraham']","['Pranab K. Muhuri', 'Amit K. Shukla', 'Ajith Abraham']","['South Asian University', 'South Asian University', 'Machine Intelligence Research Labs']","['Computer science', 'Field (mathematics)', 'Bibliometrics', 'Industrial Revolution', 'Automation', 'Data science', 'Citation', 'Citation analysis', 'Subject (documents)', 'Operations research', 'Engineering management', 'Library science']","['Computer science', 'Field (mathematics)', 'Bibliometrics', 'Industrial Revolution', 'Automation', 'Data science', 'Citation', 'Citation analysis', 'Subject (documents)', 'Operations research', 'Engineering management', 'Library science', 'Pure mathematics', 'Mechanical engineering', 'Engineering', 'Mathematics', 'Political science', 'Law']" +https://openalex.org/W2783127227,https://doi.org/10.3390/su10010166,A Bibliometric Analysis and Visualization of Medical Big Data Research,2018,660,article,en,"With the rapid development of “Internet plus”, medical care has entered the era of big data. However, there is little research on medical big data (MBD) from the perspectives of bibliometrics and visualization. The substantive research on the basic aspects of MBD itself is also rare. This study aims to explore the current status of medical big data through visualization analysis on the journal papers related to MBD. We analyze a total of 988 references which were downloaded from the Science Citation Index Expanded and the Social Science Citation Index databases from Web of Science and the time span was defined as “all years”. The GraphPad Prism 5, VOSviewer and CiteSpace softwares are used for analysis. Many results concerning the annual trends, the top players in terms of journal and institute levels, the citations and H-index in terms of country level, the keywords distribution, the highly cited papers, the co-authorship status and the most influential journals and authors are presented in this paper. This study points out the development status and trends on MBD. It can help people in the medical profession to get comprehensive understanding on the state of the art of MBD. It also has reference values for the research and application of the MBD visualization methods.",Sustainability,,"['Huchang Liao', 'Ming Tang', 'Li Luo', 'Chunyang Li', 'Francisco Chiclana', 'Xiao‐Jun Zeng']","['Huchang Liao', 'Ming Tang', 'Li Luo', 'Chunyang Li', 'Francisco Chiclana', 'Xiao‐Jun Zeng']","['Sichuan University', 'Sichuan University', 'Sichuan University', 'West China Medical Center of Sichuan University', 'De Montfort University', 'University of Manchester']","['Bibliometrics', 'Visualization', 'Big data', 'Science Citation Index', 'Citation', 'Data science', 'Web of science', 'Index (typography)', 'Citation analysis', 'Citation index', 'Information visualization', 'Computer science', 'Library science', 'MEDLINE', 'World Wide Web', 'Political science', 'Data mining']","['Bibliometrics', 'Visualization', 'Big data', 'Science Citation Index', 'Citation', 'Data science', 'Web of science', 'Index (typography)', 'Citation analysis', 'Citation index', 'Information visualization', 'Computer science', 'Library science', 'MEDLINE', 'World Wide Web', 'Political science', 'Data mining', 'Law']" +https://openalex.org/W2885251002,https://doi.org/10.1016/j.ijpe.2018.08.003,Supply chain finance: A systematic literature review and bibliometric analysis,2018,730,article,en,,International Journal of Production Economics,,"['Xinhan Xu', 'Xiangfeng Chen', 'Fu Jia', 'Steve Brown', 'Yu Gong', 'Yifan Xu']","['Xinhan Xu', 'Xiangfeng Chen', 'Fu Jia', 'Steve Brown', 'Yu Gong', 'Yifan Xu']","['Fudan University', 'Fudan University', 'University of York', 'University of Southampton', 'University of Southampton', 'Fudan University']","['Trade credit', 'Supply chain', 'Mainstream', 'Payment', 'Systematic review', 'Field (mathematics)', 'Service (business)', 'Computer science', 'Finance', 'Business', 'Marketing', 'Political science']","['Trade credit', 'Supply chain', 'Mainstream', 'Payment', 'Systematic review', 'Field (mathematics)', 'Service (business)', 'Computer science', 'Finance', 'Business', 'Marketing', 'Political science', 'Mathematics', 'Law', 'MEDLINE', 'Pure mathematics']" +https://openalex.org/W2116575643,https://doi.org/10.1007/s11192-005-1523-1,Bibliometric analysis of tsunami research,2007,440,article,en,,Scientometrics,,"['Wen‐Ta Chiu', 'Yuh‐Shan Ho']","['Wen‐Ta Chiu', 'Yuh‐Shan Ho']","['Wan Fang Hospital', 'Taipei Medical University', 'Wan Fang Hospital', 'Taipei Medical University']","['Subject (documents)', 'Distribution (mathematics)', 'Citation', 'Science Citation Index', 'Library science', 'Bibliometrics', 'Citation analysis', 'Statistics', 'History', 'Geography', 'Social science', 'Computer science', 'Sociology', 'Mathematics']","['Subject (documents)', 'Distribution (mathematics)', 'Citation', 'Science Citation Index', 'Library science', 'Bibliometrics', 'Citation analysis', 'Statistics', 'History', 'Geography', 'Social science', 'Computer science', 'Sociology', 'Mathematics', 'Mathematical analysis']" +https://openalex.org/W2165022267,https://doi.org/10.1177/0007650305278086,A Bibliometric Analysis of 30 Years of Research and Theory on Corporate Social Responsibility and Corporate Social Performance,2005,1079,article,en,"Social responsibilities of businesses and their managers have been discussed since the 1950s. Yet no consensus about progress has been achieved in the corporate social responsibility/corporate social performance literature. In this article, we seek to analyze three views on this literature. One view is that development occurred from conceptual vagueness, through clarification of central constructs and their relationships, to the testing of theory—a process supported by increased sophistication in research methods. In contrast, other authors claim that hardly any progress is to be expected because of the inherently normative character of the literature. A final view is that progress in the literature on the social responsibilities of business is obscured or even hampered by the continuing introduction of newconstructs. This article explores which of these three views better describes the evolution of the literature during a period of 30 years and suggests implications for further research.",Business & Society,,"['Frank G. A. de Bakker', 'Peter Groenewegen', 'Frank den Hond']","['Frank G. A. de Bakker', 'Peter Groenewegen', 'Frank den Hond']","['Vrije Universiteit Amsterdam', 'Vrije Universiteit Amsterdam', 'Vrije Universiteit Amsterdam']","['Corporate social responsibility', 'Normative', 'Vagueness', 'Sophistication', 'Sociology', 'Positive economics', 'Social responsibility', 'Process (computing)', 'Stakeholder', 'Public relations', 'Social science', 'Political science', 'Economics']","['Corporate social responsibility', 'Normative', 'Vagueness', 'Sophistication', 'Sociology', 'Positive economics', 'Social responsibility', 'Process (computing)', 'Stakeholder', 'Public relations', 'Social science', 'Political science', 'Economics', 'Operating system', 'Philosophy', 'Law', 'Fuzzy logic', 'Computer science', 'Linguistics']" +https://openalex.org/W3042215340,https://doi.org/10.21037/atm-20-4235,A bibliometric analysis using VOSviewer of publications on COVID-19,2020,547,article,en,"BACKGROUND: As a global pandemic, COVID-19 has aroused great concern in the last few months and a growing number of related researches have been published. Therefore, a bibliometric analysis of these publications may provide a direction of hot topics and future research trends. METHODS: The global literatures about COVID-19 published between 2019 and 2020 were scanned in the Web of Science collection database. ""COVID-19"" ""Novel Coronavirus"" ""2019-nCoV"" and ""SARS-CoV-2"" were used as the keywords to reach the relevant publications. VOSviewer was applied to perform the bibliometric analysis of these articles. RESULTS: Totally 3,626 publications on the topic of COVID-19 were identified and ""COVID-19"" with a total link strength of 2,649 appeared as the most frequent keyword, which had a strong link to ""pneumonia"" and ""epidemiology"". The mean citation count of the top 100 most cited articles was 96 (range, 26-883). Most of them were descriptive studies and concentrated on the clinical features. The highest-ranking journal was British medical journal with 211 publications and the most cited journal was Lancet with 2,485 citation counts. Eleven articles written by Christian Drosten from Berlin Institute of Virology have been cited for 389 times and 40 articles from Chinese Academy of Sciences have been cited for 1,597 times which are the most cited author and organization. The number of collaborators with China is 44 and the total link strength is 487. The main partners of China are USA, England and Germany. The published literatures have focused on three topics: disease management, clinical features and pathogenesis. CONCLUSIONS: The current growth trends predict a large increase in the number of global publications on COVID-19. China made the most outstanding contribution within this important field. Disease treatment, spike protein and vaccine may be hotspots in the future.",Annals of Translational Medicine,,"['Yuetian Yu', 'Yujie Li', 'Zhongheng Zhang', 'Zhi‐Chun Gu', 'Han Zhong', 'Qiongfang Zha', 'Luyu Yang', 'Cheng Zhu', 'Erzhen Chen']","['Yuetian Yu', 'Yujie Li', 'Zhongheng Zhang', 'Zhi‐Chun Gu', 'Han Zhong', 'Qiongfang Zha', 'Luyu Yang', 'Cheng Zhu', 'Erzhen Chen']","['Shanghai Jiao Tong University', 'Shanghai Jiao Tong University', 'Sir Run Run Shaw Hospital', 'Zhejiang University', 'Shanghai Jiao Tong University', 'Shanghai Jiao Tong University', 'Shanghai Jiao Tong University', 'Wuhan Third Hospital', 'Shanghai Jiao Tong University', 'Shanghai Jiao Tong University']","['Citation', 'Coronavirus disease 2019 (COVID-19)', 'Web of science', 'Bibliometrics', 'Library science', 'China', 'Severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2)', 'Pandemic', '2019-20 coronavirus outbreak', 'Scopus', 'MEDLINE', 'Citation analysis', 'Medicine', 'History', 'Political science', 'Computer science', 'Meta-analysis', 'Pathology', 'Disease']","['Citation', 'Coronavirus disease 2019 (COVID-19)', 'Web of science', 'Bibliometrics', 'Library science', 'China', 'Severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2)', 'Pandemic', '2019-20 coronavirus outbreak', 'Scopus', 'MEDLINE', 'Citation analysis', 'Medicine', 'History', 'Political science', 'Computer science', 'Meta-analysis', 'Pathology', 'Disease', 'Archaeology', 'Outbreak', 'Law', 'Infectious disease (medical specialty)']" +https://openalex.org/W3003683721,https://doi.org/10.1111/hir.12295,Application of bibliometrics in medicine: a historical bibliometrics analysis,2020,459,article,en,"BACKGROUND: The application of bibliometrics in medicine enables one to analyse vast amounts of publications and their production patterns on macroscopic and microscopic levels. OBJECTIVES: The aim of the study was to analyse the historical perspective of research literature production regarding application of bibliometrics in medicine. METHODS: Publications related to application of bibliometrics in medicine from 1970 to 2018 were harvested from the Scopus bibliographic database. Reference Publication Year Spectroscopy was triangulated with the VOSViewer to identify historical roots and evolution of topics and clinical areas. RESULTS: The search resulted in 6557 publications. The literature production trend was positive. Historical roots analysis identified 33 historical roots and 16 clinical areas where bibliometrics was applied. DISCUSSION: The increase in productivity in application of bibliometrics in medicine might be attributed to increased use of quantitative metrics in research evaluation, publish or perish phenomenon and the increased use of evidence-based medicine. CONCLUSION: The trend of the literature production was positive. Medicine was in the forefront of knowledge development in bibliometrics. reference publication year spectroscopy proved to be an accurate method which was able to identify most of the historical roots.",Health Information & Libraries Journal,,"['Peter Kokol', 'Helena Blažun Vošner', 'Jernej Završnik']","['Peter Kokol', 'Helena Blažun Vošner', 'Jernej Završnik']","['University of Maribor', 'Zdravstveni dom dr. Adolfa Drolca Maribor', 'Šolski center Slovenj Gradec', 'Zdravstveni dom dr. Adolfa Drolca Maribor']","['Bibliometrics', 'Scopus', 'Trend analysis', 'Data science', 'MEDLINE', 'Library science', 'Computer science', 'Biology']","['Bibliometrics', 'Scopus', 'Trend analysis', 'Data science', 'MEDLINE', 'Library science', 'Computer science', 'Biology', 'Machine learning', 'Biochemistry']" +https://openalex.org/W2915161772,https://doi.org/10.1016/j.frl.2019.02.003,"A bibliometric analysis on green finance: Current status, development, and future directions",2019,640,article,en,,Finance research letters,,"['Dayong Zhang', 'Zhiwei Zhang', 'Shunsuke Managi']","['Dayong Zhang', 'Zhiwei Zhang', 'Shunsuke Managi']","['Southwestern University of Finance and Economics', 'Institute of Economics', 'Institute of Economics', 'Southwestern University of Finance and Economics', 'Kyushu University']","['Status quo', 'Climate Finance', 'Political science', 'Regional science', 'Management science', 'Economics', 'Sociology', 'Economic growth', 'Developing country']","['Status quo', 'Climate Finance', 'Political science', 'Regional science', 'Management science', 'Economics', 'Sociology', 'Economic growth', 'Developing country', 'Law']" +https://openalex.org/W2954472560,https://doi.org/10.3390/su11133606,Bibliometric Analysis on Smart Cities Research,2019,395,article,en,"Smart cities have been a global concern in recent years, involving comprehensive scientific research. To obtain a structural overview and assist researchers in making insights into the characteristics of smart cities research, bibliometric analysis was carried out in this paper. With the application of the bibliometric analysis software VOSviewer and CiteSpace, 4409 smart cities were identified by the core collection of the Web of Science in publications between 1998 and 2019 and used in the analysis of this paper. Concretely, this research visually demonstrates a comprehensive overview of the field relating to smart cities in terms of the production of regular publications, main domain of smart cities researchers, most influential countries (institutions, sources and authors), and interesting research directions in the smart city researches. We also present the research collaboration among countries (regions), organizations and authors based on a series of cooperation analyses. The bibliometric analysis of the existing work provided a valuable and seminal reference for researchers and practitioners in smart cities-related research communities.",Sustainability,,"['Yiming Guo', 'Zhen-Ling Huang', 'Ji Guo', 'Hua Li', 'Xingrong Guo', 'Mpeoane Judith Nkeli']","['Yiming Guo', 'Zhen-Ling Huang', 'Ji Guo', 'Hua Li', 'Xingrong Guo', 'Mpeoane Judith Nkeli']","['Shanghai Maritime University', 'Shanghai Maritime University', 'Shanghai Maritime University', 'Shanghai Maritime University', 'Shanghai Maritime University', 'Shanghai Maritime University']","['Bibliometrics', 'Work (physics)', 'Smart city', 'Field (mathematics)', 'Domain (mathematical analysis)', 'Web of science', 'Data science', 'Regional science', 'Computer science', 'Knowledge management', 'Engineering', 'Geography', 'Political science', 'Library science', 'World Wide Web', 'Internet of Things']","['Bibliometrics', 'Work (physics)', 'Smart city', 'Field (mathematics)', 'Domain (mathematical analysis)', 'Web of science', 'Data science', 'Regional science', 'Computer science', 'Knowledge management', 'Engineering', 'Geography', 'Political science', 'Library science', 'World Wide Web', 'Internet of Things', 'Law', 'Mathematical analysis', 'Mathematics', 'Mechanical engineering', 'Pure mathematics', 'MEDLINE']" +https://openalex.org/W2106572956,https://doi.org/10.1016/j.tourman.2010.07.001,"Publish and perish? Bibliometric analysis, journal ranking and the assessment of research quality in tourism",2010,620,article,en,,Tourism Management,,['C. Michael Hall'],['C. Michael Hall'],"['University of Canterbury', 'Linnaeus University', 'University of Oulu']","['Bibliometrics', 'Journal ranking', 'Scopus', 'Ranking (information retrieval)', 'Tourism', 'Quality (philosophy)', 'Context (archaeology)', 'Publish or perish', 'Citation analysis', 'Government (linguistics)', 'Impact factor', 'Publication', 'Data science', 'Citation', 'Regional science', 'Marketing', 'Political science', 'Computer science', 'Sociology', 'Business', 'Library science', 'Information retrieval', 'Publishing', 'Geography', 'MEDLINE', 'Advertising']","['Bibliometrics', 'Journal ranking', 'Scopus', 'Ranking (information retrieval)', 'Tourism', 'Quality (philosophy)', 'Context (archaeology)', 'Publish or perish', 'Citation analysis', 'Government (linguistics)', 'Impact factor', 'Publication', 'Data science', 'Citation', 'Regional science', 'Marketing', 'Political science', 'Computer science', 'Sociology', 'Business', 'Library science', 'Information retrieval', 'Publishing', 'Geography', 'MEDLINE', 'Advertising', 'Law', 'Linguistics', 'Epistemology', 'Archaeology', 'Philosophy']" +https://openalex.org/W4320070415,https://doi.org/10.1186/s40561-022-00205-x,Is Metaverse in education a blessing or a curse: a combined content and bibliometric analysis,2022,587,article,en,"Abstract The Metaverse has been the centre of attraction for educationists for quite some time. This field got renewed interest with the announcement of social media giant Facebook as it rebranding and positioning it as Meta. While several studies conducted literature reviews to summarize the findings related to the Metaverse in general, no study to the best of our knowledge focused on systematically summarizing the finding related to the Metaverse in education. To cover this gap, this study conducts a systematic literature review of the Metaverse in education. It then applies both content and bibliometric analysis to reveal the research trends, focus, and limitations of this research topic. The obtained findings reveal the research gap in lifelogging applications in educational Metaverse. The findings also show that the design of Metaverse in education has evolved over generations, where generation Z is more targeted with artificial intelligence technologies compared to generation X or Y. In terms of learning scenarios, there have been very few studies focusing on mobile learning, hybrid learning, and micro learning. Additionally, no study focused on using the Metaverse in education for students with disabilities. The findings of this study provide a roadmap of future research directions to be taken into consideration and investigated to enhance the adoption of the Metaverse in education worldwide, as well as to enhance the learning and teaching experiences in the Metaverse.",Smart Learning Environments,,"['Ahmed Tlili', 'Ronghuai Huang', 'Boulus Shehata', 'Dejian Liu', 'Jialu Zhao', 'Ahmed Hosny Saleh Metwally', 'Huanhuan Wang', 'Mouna Denden', 'Aras Bozkurt', 'Lik‐Hang Lee', 'Doğuş Beyoğlu', 'Fahriye Altınay', 'R. C. Sharma', 'Zehra Altınay', 'Zhisheng Li', 'Jiahao Liu', 'Faizan Ahmad', 'Ying Hu', 'Soheil Salha', 'Mourad Abed', 'Daniel Burgos']","['Ahmed Tlili', 'Ronghuai Huang', 'Boulus Shehata', 'Dejian Liu', 'Jialu Zhao', 'Ahmed Hosny Saleh Metwally', 'Huanhuan Wang', 'Mouna Denden', 'Aras Bozkurt', 'Lik‐Hang Lee', 'Doğuş Beyoğlu', 'Fahriye Altınay', 'R. C. Sharma', 'Zehra Altınay', 'Zhisheng Li', 'Jiahao Liu', 'Faizan Ahmad', 'Ying Hu', 'Soheil Salha', 'Mourad Abed', 'Daniel Burgos']","['Beijing Normal University', 'Beijing Normal University', 'Beijing Normal University', 'Beijing Normal University', 'Beijing Normal University', 'Beijing Normal University', 'Beijing Normal University', 'Centre National de la Recherche Scientifique', 'Institut National des Sciences Appliquées de Rennes', ""Laboratoire d'Automatique, de Mécanique et d'Informatique Industrielles et Humaines"", 'INSA Hauts-de-France', 'Université Polytechnique Hauts-de-France', 'Anadolu University', 'University of South Africa', 'Eskişehir City Hospital', 'Korea Advanced Institute of Science and Technology', 'Near East University', 'Near East University', 'Ambedkar University Delhi', 'Near East University', 'Beijing Normal University', 'Beijing Normal University', 'COMSATS University Islamabad', 'Beijing Normal University', 'Beijing Normal University', 'An-Najah National University', 'Centre National de la Recherche Scientifique', 'Institut National des Sciences Appliquées de Rennes', ""Laboratoire d'Automatique, de Mécanique et d'Informatique Industrielles et Humaines"", 'INSA Hauts-de-France', 'Université Polytechnique Hauts-de-France', 'Universidad Internacional De La Rioja']","['Metaverse', 'Computer science', 'Human–computer interaction']","['Metaverse', 'Computer science', 'Human–computer interaction', 'Virtual reality']" +https://openalex.org/W2510091332,https://doi.org/10.1016/j.compedu.2016.03.010,Virtual and remote labs in education: A bibliometric analysis,2016,562,article,en,,Computers & Education,,"['Rubén Heradio', 'Luis de la Torre', 'Daniel Galán', 'Francisco Javier Cabrerizo', 'Enrique Herrera‐Viedma', 'S. Dormido']","['Rubén Heradio', 'Luis de la Torre', 'Daniel Galán', 'Francisco Javier Cabrerizo', 'Enrique Herrera‐Viedma', 'S. Dormido']","['Universidad Nacional de Educación a Distancia', 'Software (Spain)', 'Universidad Nacional de Educación a Distancia', 'Universidad Nacional de Educación a Distancia', 'Universidad Nacional de Educación a Distancia', 'Software (Spain)', 'Universidad de Granada', 'Universidad Nacional de Educación a Distancia']","['Scopus', 'Web of science', 'Computer science', 'Virtual space', 'Space (punctuation)', 'World Wide Web', 'Data science', 'Multimedia', 'MEDLINE', 'Political science', 'Artificial intelligence']","['Scopus', 'Web of science', 'Computer science', 'Virtual space', 'Space (punctuation)', 'World Wide Web', 'Data science', 'Multimedia', 'MEDLINE', 'Political science', 'Artificial intelligence', 'Operating system', 'Law']" +https://openalex.org/W58954717,,How to use Bibexcel for various types of bibliometric analysis,2009,624,article,en,"SOCIETY LAWYERS Contact Us Our Locations California Hawaii Alabama Florida Tips you should follow while hiring an experienced attorney When hiring an attorney, you want to make sure they have a track record of success, past and present. Ask your attorney about the cases he has handled and his track record. Some law firms post",Research at the University of Copenhagen (University of Copenhagen),,"['Olle Persson', 'Rickard Danell', 'Jesper Wiborg Schneider']","['Olle Persson', 'Rickard Danell', 'Jesper Wiborg Schneider']","['Umeå University', 'Umeå University']",['Computer science'],['Computer science'] +https://openalex.org/W3025370095,https://doi.org/10.2196/18228,Artificial Intelligence in Health Care: Bibliometric Analysis,2020,444,article,en,"BACKGROUND: As a critical driving power to promote health care, the health care-related artificial intelligence (AI) literature is growing rapidly. OBJECTIVE: The purpose of this analysis is to provide a dynamic and longitudinal bibliometric analysis of health care-related AI publications. METHODS: The Web of Science (Clarivate PLC) was searched to retrieve all existing and highly cited AI-related health care research papers published in English up to December 2019. Based on bibliometric indicators, a search strategy was developed to screen the title for eligibility, using the abstract and full text where needed. The growth rate of publications, characteristics of research activities, publication patterns, and research hotspot tendencies were computed using the HistCite software. RESULTS: The search identified 5235 hits, of which 1473 publications were included in the analyses. Publication output increased an average of 17.02% per year since 1995, but the growth rate of research papers significantly increased to 45.15% from 2014 to 2019. The major health problems studied in AI research are cancer, depression, Alzheimer disease, heart failure, and diabetes. Artificial neural networks, support vector machines, and convolutional neural networks have the highest impact on health care. Nucleosides, convolutional neural networks, and tumor markers have remained research hotspots through 2019. CONCLUSIONS: This analysis provides a comprehensive overview of the AI-related research conducted in the field of health care, which helps researchers, policy makers, and practitioners better understand the development of health care-related AI research and possible practice implications. Future AI research should be dedicated to filling in the gaps between AI health care research and clinical applications.",Journal of Medical Internet Research,,"['Yuqi Guo', 'Zhichao Hao', 'Shichong Zhao', 'Jiaqi Gong', 'Fan Yang']","['Yuqi Guo', 'Zhichao Hao', 'Shichong Zhao', 'Jiaqi Gong', 'Fan Yang']","['University of North Carolina at Charlotte', 'University of Alabama', 'Dongbei University of Finance and Economics', 'University of Maryland, Baltimore', 'Dongbei University of Finance and Economics']","['Health care', 'Bibliometrics', 'Artificial intelligence', 'MEDLINE', 'Data science', 'Computer science', 'Medicine', 'Data mining', 'Political science']","['Health care', 'Bibliometrics', 'Artificial intelligence', 'MEDLINE', 'Data science', 'Computer science', 'Medicine', 'Data mining', 'Political science', 'Law']" +https://openalex.org/W2886191303,https://doi.org/10.1016/j.techfore.2018.07.006,Knowledge management: A global examination based on bibliometric analysis,2018,537,article,en,,Technological Forecasting and Social Change,,"['Magaly Gaviria-Marín', 'José M. Merigó', 'Hugo Baier-Fuentes']","['Magaly Gaviria-Marín', 'José M. Merigó', 'Hugo Baier-Fuentes']","['Universidad Católica de la Santísima Concepción', 'Universitat de Barcelona', 'University of Chile', 'University of Technology Sydney', 'Universidad Católica de la Santísima Concepción']","['Field (mathematics)', 'Bibliometrics', 'Web of science', 'Computer science', 'Data science', 'Knowledge management', 'Library science', 'Political science', 'MEDLINE']","['Field (mathematics)', 'Bibliometrics', 'Web of science', 'Computer science', 'Data science', 'Knowledge management', 'Library science', 'Political science', 'MEDLINE', 'Mathematics', 'Law', 'Pure mathematics']" +https://openalex.org/W4283591250,https://doi.org/10.1007/s10639-022-11167-5,Systematic literature review and bibliometric analysis on virtual reality and education,2022,523,article,en,"The objective of this study is to identify and analyze the scientific literature with a bibliometric analysis to find the main topics, authors, sources, most cited articles, and countries in the literature on virtual reality in education. Another aim is to understand the conceptual, intellectual, and social structure of the literature on the subject and identify the knowledge base of the use of VR in education and whether it is commonly used and integrated into teaching-learning processes. To do this, articles indexed in the Main Collections of the Web of Science, Scopus and Lens were analyzed for the period 2010 to 2021. The research results are presented in two parts: the first is a quantitative analysis that provides an overview of virtual reality (VR) technology used in the educational field, with tables, graphs, and maps, highlighting the main performance indicators for the production of articles and their citation. The results obtained found a total of 718 articles of which the following were analyzed 273 published articles. The second stage consisted of an inductive type of analysis that found six major groups in the cited articles, which are instruction and learning using VR, VR learning environments, use of VR in different fields of knowledge, learning processes using VR applications or games, learning processes employing simulation, and topics published during the Covid-19 pandemic. Another important aspect to mention is that VR is used in many different areas of education, but until the beginning of the pandemic the use of this so-called ""disruptive process"" came mainly from students, Institutions were reluctant and slow to accept and include VR in the teaching-learning processes.",Education and Information Technologies,,"['Mario Rojas Sánchez', 'Pedro R. Palos‐Sánchez', 'José Antonio Folgado-Fernández']","['Mario Rojas Sánchez', 'Pedro R. Palos‐Sánchez', 'José Antonio Folgado-Fernández']","['Instituto Tecnológico de Costa Rica', 'University of Beira Interior', 'Universidad de Sevilla', 'Universidad de Extremadura']","['Virtual reality', 'Computer science', 'Scopus', 'Subject (documents)', 'Bibliometrics', 'Instructional simulation', 'Educational technology', 'Process (computing)', 'Citation', 'Scientific literature', 'Content analysis', 'Data science', 'Mathematics education', 'World Wide Web', 'Psychology', 'Social science', 'Sociology', 'Human–computer interaction']","['Virtual reality', 'Computer science', 'Scopus', 'Subject (documents)', 'Bibliometrics', 'Instructional simulation', 'Educational technology', 'Process (computing)', 'Citation', 'Scientific literature', 'Content analysis', 'Data science', 'Mathematics education', 'World Wide Web', 'Psychology', 'Social science', 'Sociology', 'Human–computer interaction', 'Paleontology', 'Biology', 'Operating system', 'MEDLINE', 'Political science', 'Law']" +https://openalex.org/W2990688366,https://doi.org/10.1016/j.jbusres.2019.11.025,"A bibliometric analysis of board diversity: Current status, development, and future research directions",2019,601,article,en,,Journal of Business Research,,"['H. Kent Baker', 'Nitesh Pandey', 'Satish Kumar', 'Arunima Haldar']","['H. Kent Baker', 'Nitesh Pandey', 'Satish Kumar', 'Arunima Haldar']","['American University', 'Malaviya National Institute of Technology Jaipur', 'Malaviya National Institute of Technology Jaipur']","['Diversity (politics)', 'Nationality', 'Ethnic group', 'Bibliometrics', 'Field (mathematics)', 'Gender diversity', 'Political science', 'Psychology', 'Library science', 'Immigration', 'Computer science', 'Corporate governance', 'Business']","['Diversity (politics)', 'Nationality', 'Ethnic group', 'Bibliometrics', 'Field (mathematics)', 'Gender diversity', 'Political science', 'Psychology', 'Library science', 'Immigration', 'Computer science', 'Corporate governance', 'Business', 'Law', 'Pure mathematics', 'Mathematics', 'Finance']" +https://openalex.org/W2592517713,https://doi.org/10.1016/j.ibusrev.2017.02.007,Bibliometric analysis of absorptive capacity,2017,351,article,en,,International Business Review,,"['Indri Dwi Apriliyanti', 'Ilan Alon']","['Indri Dwi Apriliyanti', 'Ilan Alon']","['Universitas Gadjah Mada', 'University of Agder', 'University of Agder']","['Absorptive capacity', 'Categorization', 'Citation', 'Knowledge management', 'Knowledge transfer', 'Bibliometrics', 'Computer science', 'Data science', 'Sociology', 'Library science', 'Artificial intelligence']","['Absorptive capacity', 'Categorization', 'Citation', 'Knowledge management', 'Knowledge transfer', 'Bibliometrics', 'Computer science', 'Data science', 'Sociology', 'Library science', 'Artificial intelligence']" +https://openalex.org/W4401785934,https://doi.org/10.38124/ijisrt/ijisrt23nov2413,"A Bibliometric Analysis of Heart Disease Detection using Artificial Intelligence Techniques: Trends, Influential Works, and Research Gaps",2023,777,article,en,"Advanced diagnostic techniques are required as cardiovascular diseases continue to pose a serious threat to global health. The scientific community has recently shown a great deal of interest in the application of deep learning techniques to the detection of heart disease. In order to synthesize the body of research on the use of deep learning in the detection of heart disease, this study provides a thorough bibliometric analysis. A wide variety of publications, including articles, conference papers, and reviews, are included in the analysis. These were obtained from Scopus and WoS databases. Total 662 documents are analyzed from these databases. The study looks at geographic distributions, historical trends, and influential figures in the field. We uncover key papers and authors through quantitative analyses, providing insight into the way research themes have changed over time. The study delves into co-authorship networks and institutional collaborations, offering valuable perspectives on the collaborative environment among scholars operating within this field. To find popular terms and hot topics, keyword analysis is used, which helps to provide a more sophisticated understanding of the main ideas guiding the research that is being done today.",International Journal of Innovative Science and Research Technology (IJISRT),,"['Akshat Kotadia', 'Bhavy Masalia', 'Om Mehra', 'Lakshin Pathak']","['Akshat Kotadia', 'Bhavy Masalia', 'Om Mehra', 'Lakshin Pathak']",[],"['Artificial intelligence', 'Computer science', 'Data science']","['Artificial intelligence', 'Computer science', 'Data science']" +https://openalex.org/W4385494672,https://doi.org/10.1002/joe.22229,Guidelines for interpreting the results of bibliometric analysis: A sensemaking approach,2023,369,article,en,"Abstract While bibliometric analysis is inherently quantitative and objective, it necessitates interpretation, thereby introducing an element of subjectivity. This article proposes a sensemaking approach that transitions researchers from mere description to proactive interpretation of bibliometric results, transforming raw information into informed insights. We discuss the applicability of sensemaking in bibliometric analysis and offer practical guidelines for its integration into systematic literature reviews. These guidelines revolve around a three‐stage sensemaking process—that is, scanning, sensing, and substantiating—each crucial to deriving meaningful interpretations. As such, this article serves as a valuable guide for researchers seeking to utilize bibliometric analysis as a potent analytical tool in their review studies.",Global Business and Organizational Excellence,,"['Weng Marc Lim', 'Satish Kumar']","['Weng Marc Lim', 'Satish Kumar']","['Swinburne University of Technology', 'Sunway University', 'Swinburne University of Technology Sarawak Campus', 'Indian Institute of Management Ahmedabad', 'Sunway University']","['Sensemaking', 'Interpretation (philosophy)', 'Process (computing)', 'Management science', 'Computer science', 'Subjectivity', 'Data science', 'Raw data', 'Epistemology', 'Knowledge management', 'Engineering']","['Sensemaking', 'Interpretation (philosophy)', 'Process (computing)', 'Management science', 'Computer science', 'Subjectivity', 'Data science', 'Raw data', 'Epistemology', 'Knowledge management', 'Engineering', 'Philosophy', 'Operating system', 'Programming language']" +https://openalex.org/W2576786802,https://doi.org/10.1016/j.jik.2016.12.002,An overview of qualitative comparative analysis: A bibliometric analysis,2017,384,article,en,"This study is organized in two parts. We conduct a general analysis of the use of qualitative comparative analysis (QCA), and a bibliometric study of the use of QCA to analyze the specificities of the research publications that apply this methodology. Our results show the differences in quantitative terms of the three variants of this methodology: fsQCA, csQCA, and mvQCA.",Journal of Innovation & Knowledge,,"['Norat Roig‐Tierno', 'Tomas F. Gonzalez-Cruz', 'Jordi Llopis-Martinez']","['Norat Roig‐Tierno', 'Tomas F. Gonzalez-Cruz', 'Jordi Llopis-Martinez']","['Valencian International University', 'Universitat de València', 'Universitat de València']","['Qualitative comparative analysis', 'Humanities', 'Qualitative analysis', 'Qualitative research', 'Sociology', 'Mathematics', 'Philosophy', 'Social science', 'Statistics']","['Qualitative comparative analysis', 'Humanities', 'Qualitative analysis', 'Qualitative research', 'Sociology', 'Mathematics', 'Philosophy', 'Social science', 'Statistics']" +https://openalex.org/W2919854756,https://doi.org/10.3390/su11051377,Tourism Research on Sustainability: A Bibliometric Analysis,2019,356,article,en,"Tourism represents one of the main industries in terms of job creation and economic development while sustainability in tourism represents a worldwide challenge. The objective of the present study is to use a bibliometric approach to review the relevant literature. Bibliometric indicators, such as citations, are used to identify the field structure and the VOSviewer software is used to map the main trends in this area. Over the period 1987–2018, a total of 4647 papers were found in Scopus regarding sustainability issues in tourism. Analysis of the leading journals, authors, institutions, and keywords indicates that: (1) the literature on sustainability issues in the field of tourism is significantly growing; (2) a mere six papers accounted more than 300 citations, but there are several prolific authors; (3) of the 614 sources included in the review, the most important have published 46.7% of the papers; (4) in terms of documents and citations, the United States is the leading country in this topic; (5) according to keyword trend network analysis, sustainability is becoming a strategic approach for companies and tourist destinations. Finally, this subfield within the tourism literature has considerable potential and is expected to continue growing.",Sustainability,,"['Àngels Niñerola', 'María Victòria Sánchez Rebull', 'Ana Beatriz Hernández‐Lara']","['Àngels Niñerola', 'María Victòria Sánchez Rebull', 'Ana Beatriz Hernández‐Lara']","['Universitat Rovira i Virgili', 'Universitat Rovira i Virgili', 'Universitat Rovira i Virgili']","['Scopus', 'Sustainability', 'Tourism', 'Bibliometrics', 'Destinations', 'Regional science', 'Business', 'Geography', 'Marketing', 'Political science', 'Computer science', 'Library science', 'MEDLINE']","['Scopus', 'Sustainability', 'Tourism', 'Bibliometrics', 'Destinations', 'Regional science', 'Business', 'Geography', 'Marketing', 'Political science', 'Computer science', 'Library science', 'MEDLINE', 'Archaeology', 'Biology', 'Law', 'Ecology']" +https://openalex.org/W2150220236,https://doi.org/10.1007/s11192-009-0146-3,"Software survey: VOSviewer, a computer program for bibliometric mapping",2009,19703,article,en,"We present VOSviewer, a freely available computer program that we have developed for constructing and viewing bibliometric maps. Unlike most computer programs that are used for bibliometric mapping, VOSviewer pays special attention to the graphical representation of bibliometric maps. The functionality of VOSviewer is especially useful for displaying large bibliometric maps in an easy-to-interpret way. The paper consists of three parts. In the first part, an overview of VOSviewer's functionality for displaying bibliometric maps is provided. In the second part, the technical implementation of specific parts of the program is discussed. Finally, in the third part, VOSviewer's ability to handle large maps is demonstrated by using the program to construct and display a co-citation map of 5,000 major scientific journals.",Scientometrics,,"['Nees Jan van Eck', 'Ludo Waltman']","['Nees Jan van Eck', 'Ludo Waltman']","['Leiden University', 'Erasmus University Rotterdam', 'Leiden University', 'Erasmus University Rotterdam']","['Computer science', 'Construct (python library)', 'Bibliometrics', 'Citation', 'Software', 'Representation (politics)', 'Data science', 'World Wide Web']","['Computer science', 'Construct (python library)', 'Bibliometrics', 'Citation', 'Software', 'Representation (politics)', 'Data science', 'World Wide Web', 'Law', 'Political science', 'Politics', 'Programming language']" +https://openalex.org/W2785537869,https://doi.org/10.1108/ejm-11-2017-0853,Fifty years of the European Journal of Marketing: a bibliometric analysis,2018,550,article,en,"Purpose The European Journal of Marketing was created in 1967. In 2017, the journal celebrates its 50th anniversary. Therefore, the purpose of this study is to present a bibliometric overview of the leading trends of the journal during this period. Design/methodology/approach This work uses the Scopus database to analyse the most productive authors, institutions and countries, as well as the most cited papers and the citing articles. The investigation uses bibliometric indicators to represent the bibliographic data, including the total number of publications and citations between 1967 and 2017. Additionally, the article also develops a graphical visualization of the bibliographic material by using the visualization of similarities viewer software to map journals, keywords and institutions with bibliographic coupling and co-citation analysis. Findings British authors and institutions are the most productive in the journal, although Australians’ are growing significantly the number of papers published. Continental European institutions are also increasing the number of publications, but they are still far from reaching the British contribution so far. In the mid-term, however, these zone’s authors and institutions, especially those from big European countries like France, Germany, Italy and Spain, should reach a closer performance to British ones; more as less long, historic, but more recent periods of analysis are considered. Practical implications This article is useful for any reader of this journal to understand questions such as papers’ European Journal of Marketing -related scientific productivity in terms of, for instance, contributors/authors, institutions and countries, or the main sources used to back them. Originality/value This is the first comprehensive article offering a general overview of the leading trends and researchers of the journal over its history.",European Journal of Marketing,,"['Francisco J. Martínez‐López', 'José M. Merigó', 'Leslier Valenzuela‐Fernández', 'Carolina Nicolás']","['Francisco J. Martínez‐López', 'José M. Merigó', 'Leslier Valenzuela‐Fernández', 'Carolina Nicolás']","['Universidad de Granada', 'EAE Business School', 'University of Chile', 'University of Chile', 'Universidad Santo Tomás']","['Scopus', 'Originality', 'Bibliographic coupling', 'Citation', 'Bibliometrics', 'Library science', 'Productivity', 'Bibliographic database', 'European commission', 'Citation analysis', 'Impact factor', 'Regional science', 'Political science', 'Social science', 'Sociology', 'European union', 'Computer science', 'Business', 'Economics', 'MEDLINE', 'Economic growth', 'Law']","['Scopus', 'Originality', 'Bibliographic coupling', 'Citation', 'Bibliometrics', 'Library science', 'Productivity', 'Bibliographic database', 'European commission', 'Citation analysis', 'Impact factor', 'Regional science', 'Political science', 'Social science', 'Sociology', 'European union', 'Computer science', 'Business', 'Economics', 'MEDLINE', 'Economic growth', 'Law', 'Qualitative research', 'Economic policy']" +https://openalex.org/W2981634144,https://doi.org/10.3791/58494,"Comparing Bibliometric Analysis Using PubMed, Scopus, and Web of Science Databases",2019,491,article,en,"Literature databases (i.e., PubMed, Scopus, and Web of Science) differ in terms of their coverage, focus, and the tool they provide. PubMed focuses mainly on life sciences and biomedical disciplines, whereas Scopus and Web of Science are multidisciplinary. The protocol described in the current study was used to search for publications from Jordanian authors in the years 2013-2017. In this protocol, how to use each database to conduct this type of search is explained in detail. A Scopus search resulted in the highest number of documents (11,444 documents), followed by a Web of Science search (10,943 documents). PubMed resulted in a smaller number of documents due to its narrower scope and coverage (4,363 documents). The results also show a yearly trend in: (1) the number of publications, (2) the disciplines that have the most publications, (3) the countries of collaboration, and (4) the number of open access publications. In contrast, PubMed has a sophisticated keyword optimization service (i.e., Medical Subject Heading, or MeSH), while both Scopus and Web of Science provide search analysis tools that can produce representative figures. Finally, the features of each database are explained in detail and several indices that can be extracted using the search results are provided. This study provides a base for using literature databases for bibliometric analysis.",Journal of Visualized Experiments,,"['Saif Aldeen AlRyalat', 'Lna Malkawi', 'Shaher Momani']","['Saif Aldeen AlRyalat', 'Lna Malkawi', 'Shaher Momani']","['University of Jordan', 'Yahoo (Spain)', 'University of Jordan', 'University of Jordan', 'Northwest African American Museum', 'King Abdulaziz University']","['Scopus', 'Web of science', 'Computer science', 'Subject (documents)', 'Scope (computer science)', 'Bibliometrics', 'Information retrieval', 'Multidisciplinary approach', 'Database', 'MEDLINE', 'Bibliographic database', 'Protocol (science)', 'World Wide Web', 'Data science', 'Medicine', 'Political science']","['Scopus', 'Web of science', 'Computer science', 'Subject (documents)', 'Scope (computer science)', 'Bibliometrics', 'Information retrieval', 'Multidisciplinary approach', 'Database', 'MEDLINE', 'Bibliographic database', 'Protocol (science)', 'World Wide Web', 'Data science', 'Medicine', 'Political science', 'Alternative medicine', 'Law', 'Programming language', 'Pathology']" +https://openalex.org/W2191867853,https://doi.org/10.1016/j.jbusres.2015.10.054,A bibliometric analysis of international impact of business incubators,2015,343,article,en,,Journal of Business Research,,"['Gema Albort-Morant', 'Domingo Ribeiro Soriano']","['Gema Albort-Morant', 'Domingo Ribeiro Soriano']","['Universitat de València', 'Universitat de València']","['Bibliometrics', 'Productivity', 'Web of science', 'Cover (algebra)', 'Regional science', 'Library science', 'Business', 'Political science', 'Computer science', 'Sociology', 'Economics', 'Engineering', 'Economic growth', 'MEDLINE']","['Bibliometrics', 'Productivity', 'Web of science', 'Cover (algebra)', 'Regional science', 'Library science', 'Business', 'Political science', 'Computer science', 'Sociology', 'Economics', 'Engineering', 'Economic growth', 'MEDLINE', 'Law', 'Mechanical engineering']" +https://openalex.org/W2793000158,https://doi.org/10.1016/j.jbusres.2017.12.054,A bibliometric analysis of born global firms,2018,304,article,en,,Journal of Business Research,,['Piotr Dzikowski'],['Piotr Dzikowski'],['University of Zielona Góra'],"['Citation', 'Citation analysis', 'Bibliometrics', 'Productivity', 'Web of science', 'Regional science', 'Library science', 'Political science', 'Sociology', 'Economics', 'Computer science', 'Economic growth', 'MEDLINE', 'Law']","['Citation', 'Citation analysis', 'Bibliometrics', 'Productivity', 'Web of science', 'Regional science', 'Library science', 'Political science', 'Sociology', 'Economics', 'Computer science', 'Economic growth', 'MEDLINE', 'Law']" +https://openalex.org/W2610818236,https://doi.org/10.1016/j.jclepro.2017.05.018,Corporate social responsibility for supply chain management: A literature review and bibliometric analysis,2017,495,review,en,,Journal of Cleaner Production,,"['Yunting Feng', 'Qinghua Zhu', 'Kee‐hung Lai']","['Yunting Feng', 'Qinghua Zhu', 'Kee‐hung Lai']","['Shanghai Jiao Tong University', 'Shanghai Jiao Tong University', 'Hong Kong Polytechnic University']","['Corporate social responsibility', 'Stakeholder', 'Normative', 'Social network analysis', 'Supply chain', 'Knowledge management', 'Supply chain management', 'Citation analysis', 'Business', 'Citation', 'Field (mathematics)', 'Sociology', 'Management science', 'Computer science', 'Political science', 'Marketing', 'Public relations', 'Engineering', 'Social science']","['Corporate social responsibility', 'Stakeholder', 'Normative', 'Social network analysis', 'Supply chain', 'Knowledge management', 'Supply chain management', 'Citation analysis', 'Business', 'Citation', 'Field (mathematics)', 'Sociology', 'Management science', 'Computer science', 'Political science', 'Marketing', 'Public relations', 'Engineering', 'Social science', 'Law', 'Social capital', 'Pure mathematics', 'Mathematics', 'World Wide Web']" +https://openalex.org/W2072689080,https://doi.org/10.1080/09669582.2014.978790,Trends and patterns in sustainable tourism research: a 25-year bibliometric analysis,2015,439,article,en,"In the quarter of a century since the release of the 1987 Brundtland Report, sustainable tourism has emerged as the dominant paradigm in tourism development. However, the debate, discourse, and criticism of this subfield of tourism research continues. To address such concerns the purpose of this paper is to explore trends and patterns in sustainable tourism research over the past 25 years. A 25-year bibliometric analysis was conducted for the four highest ranked journals in the tourism field. Results indicate that the growth in sustainable tourism research has been remarkable, with 492 papers published in these four journals and almost half of these in the last two years of the analysis. The largest proportion of papers published on sustainable tourism was case studies, empirical studies, and critical reviews. This study found that while the theoretical and methodological approaches appear to have matured over time, the subjects and themes in sustainable tourism research, with some exceptions, have remained constant. However, the field is clearly maturing with a move away from definitional and conceptual papers to papers focused on testing and applying theory through empirical research.",Journal of Sustainable Tourism,,"['Lisa Ruhanen', 'Betty Weiler', 'Brent Moyle', 'Char-lee McLennan']","['Lisa Ruhanen', 'Betty Weiler', 'Brent Moyle', 'Char-lee McLennan']","['University of Queensland', 'Southern Cross University', 'Southern Cross University', 'Griffith University']","['Tourism', 'Sustainable tourism', 'Regional science', 'Bibliometrics', 'Empirical research', 'Tourism geography', 'Sustainable development', 'Criticism', 'Sustainability', 'Social science', 'Political science', 'Sociology', 'Library science', 'Epistemology']","['Tourism', 'Sustainable tourism', 'Regional science', 'Bibliometrics', 'Empirical research', 'Tourism geography', 'Sustainable development', 'Criticism', 'Sustainability', 'Social science', 'Political science', 'Sociology', 'Library science', 'Epistemology', 'Ecology', 'Computer science', 'Biology', 'Philosophy', 'Law']" +https://openalex.org/W3125707221,https://doi.org/10.1177/1094428114562629,Bibliometric Methods in Management and Organization,2014,6624,article,en,"We aim to develop a meaningful single-source reference for management and organization scholars interested in using bibliometric methods for mapping research specialties. Such methods introduce a measure of objectivity into the evaluation of scientific literature and hold the potential to increase rigor and mitigate researcher bias in reviews of scientific literature by aggregating the opinions of multiple scholars working in the field. We introduce the bibliometric methods of citation analysis, co-citation analysis, bibliographical coupling, co-author analysis, and co-word analysis and present a workflow for conducting bibliometric studies with guidelines for researchers. We envision that bibliometric methods will complement meta-analysis and qualitative structured literature reviews as a method for reviewing and evaluating scientific literature. To demonstrate bibliometric methods, we performed a citation and co-citation analysis to map the intellectual structure of the Organizational Research Methods journal.",Organizational Research Methods,,"['Ivan Župič', 'Tomaž Čater']","['Ivan Župič', 'Tomaž Čater']","['University of Ljubljana', 'University of Ljubljana']","['Bibliographic coupling', 'Citation analysis', 'Citation', 'Objectivity (philosophy)', 'Bibliometrics', 'Workflow', 'Computer science', 'Co-citation', 'Data science', 'Field (mathematics)', 'Management science', 'Sociology', 'Knowledge management', 'Library science', 'Epistemology', 'Database', 'Engineering']","['Bibliographic coupling', 'Citation analysis', 'Citation', 'Objectivity (philosophy)', 'Bibliometrics', 'Workflow', 'Computer science', 'Co-citation', 'Data science', 'Field (mathematics)', 'Management science', 'Sociology', 'Knowledge management', 'Library science', 'Epistemology', 'Database', 'Engineering', 'Mathematics', 'Philosophy', 'Pure mathematics']" +https://openalex.org/W3198357836,https://doi.org/10.1016/j.jbef.2021.100577,"Artificial intelligence and machine learning in finance: Identifying foundations, themes, and research clusters from bibliometric analysis",2021,665,article,en,,Journal of Behavioral and Experimental Finance,,"['John W. Goodell', 'Satish Kumar', 'Weng Marc Lim', 'Debidutta Pattnaik']","['John W. Goodell', 'Satish Kumar', 'Weng Marc Lim', 'Debidutta Pattnaik']","['University of Akron', 'Malaviya National Institute of Technology Jaipur', 'Swinburne University of Technology Sarawak Campus', 'Swinburne University of Technology Sarawak Campus', 'Woxsen School of Business', 'Malaviya National Institute of Technology Jaipur']","['Scholarship', 'Bibliographic coupling', 'Valuation (finance)', 'Corporate finance', 'Finance', 'Citation', 'Portfolio', 'Artificial intelligence', 'Sociology', 'Economics', 'Computer science', 'Library science']","['Scholarship', 'Bibliographic coupling', 'Valuation (finance)', 'Corporate finance', 'Finance', 'Citation', 'Portfolio', 'Artificial intelligence', 'Sociology', 'Economics', 'Computer science', 'Library science', 'Economic growth']" +https://openalex.org/W1743190515,https://doi.org/10.1007/s11192-015-1747-7,Economics in Latin America: a bibliometric analysis,2015,346,article,en,,Scientometrics,,"['Claudio A. Bonilla', 'José M. Merigó', 'Carolina Torres-Abad']","['Claudio A. Bonilla', 'José M. Merigó', 'Carolina Torres-Abad']","['University of Chile', 'University of Chile', 'University of Chile']","['Bibliometrics', 'Latin Americans', 'Web of science', 'Per capita', 'Regional science', 'Scientometrics', 'Scopus', 'Order (exchange)', 'Library science', 'Political science', 'Geography', 'Economics', 'Demography', 'Sociology', 'MEDLINE', 'Computer science', 'Population']","['Bibliometrics', 'Latin Americans', 'Web of science', 'Per capita', 'Regional science', 'Scientometrics', 'Scopus', 'Order (exchange)', 'Library science', 'Political science', 'Geography', 'Economics', 'Demography', 'Sociology', 'MEDLINE', 'Computer science', 'Population', 'Law', 'Finance']" +https://openalex.org/W3183627559,https://doi.org/10.1016/j.jbusres.2021.07.015,Mapping the electronic word-of-mouth (eWOM) research: A systematic review and bibliometric analysis,2021,455,review,en,,Journal of Business Research,,"['Naveen Donthu', 'Satish Kumar', 'Neeraj Pandey', 'Nitesh Pandey', 'Akanksha Mishra']","['Naveen Donthu', 'Satish Kumar', 'Neeraj Pandey', 'Nitesh Pandey', 'Akanksha Mishra']","['Georgia State University', 'Swinburne University of Technology Sarawak Campus', 'Malaviya National Institute of Technology Jaipur', 'National Institute of Industrial Engineering', 'Malaviya National Institute of Technology Jaipur', 'National Institute of Industrial Engineering']","['Word of mouth', 'Hospitality', 'Social media', 'Service (business)', 'Loyalty', 'Marketing', 'Field (mathematics)', 'Focus (optics)', 'Tourism', 'Content analysis', 'Advertising', 'Sociology', 'Business', 'Psychology', 'Computer science', 'Political science', 'World Wide Web', 'Social science']","['Word of mouth', 'Hospitality', 'Social media', 'Service (business)', 'Loyalty', 'Marketing', 'Field (mathematics)', 'Focus (optics)', 'Tourism', 'Content analysis', 'Advertising', 'Sociology', 'Business', 'Psychology', 'Computer science', 'Political science', 'World Wide Web', 'Social science', 'Law', 'Pure mathematics', 'Physics', 'Optics', 'Mathematics']" +https://openalex.org/W2943541748,https://doi.org/10.1016/j.cities.2019.04.015,Neighbourhood walkability: A review and bibliometric analysis,2019,290,review,en,,Cities,,"['Hao Wang', 'Yuqi Yang']","['Hao Wang', 'Yuqi Yang']","['Central University of Finance and Economics', 'Central University of Finance and Economics']","['Walkability', 'Neighbourhood (mathematics)', 'Built environment', 'Geography', 'Transport engineering', 'Environmental planning', 'Environmental health', 'Civil engineering', 'Medicine', 'Engineering']","['Walkability', 'Neighbourhood (mathematics)', 'Built environment', 'Geography', 'Transport engineering', 'Environmental planning', 'Environmental health', 'Civil engineering', 'Medicine', 'Engineering', 'Mathematics', 'Mathematical analysis']" diff --git a/www/services/bibliometrix_etl/outputs/scopus_first_5_normalized_rows.csv b/www/services/bibliometrix_etl/outputs/scopus_first_5_normalized_rows.csv new file mode 100644 index 000000000..8c0277eee --- /dev/null +++ b/www/services/bibliometrix_etl/outputs/scopus_first_5_normalized_rows.csv @@ -0,0 +1,4 @@ +DB,UT,DI,PMID,TI,SO,JI,PY,DT,LA,TC,AU,AF,C1,RP,CR,DE,ID,AB,VL,IS,BP,EP,SR +SCOPUS,SCOPUS-ID-001,10.1000/sample1,,Bibliometric Analysis of Artificial Intelligence Research,Journal of Data Science,,2024,Article,English,15,Smith J.; Rahman A.,"Smith, John; Rahman, Ahmed",Nanjing University of Information Science and Technology; University of Dhaka,,Reference A; Reference B; Reference C,bibliometrics; artificial intelligence; research trends,data science; scientometrics,This study analyzes artificial intelligence research using bibliometric methods.,12,2,101,115,"Smith J., 2024, Journal of Data Science" +SCOPUS,SCOPUS-ID-002,10.1000/sample2,,OpenAlex Data Standardization for Bibliometrix Python,Scientometrics Review,,2023,Conference Paper,English,9,Chen L.; Karim M.,"Chen, Li; Karim, Mohammad",Nanjing University of Information Science and Technology,,Reference X; Reference Y,OpenAlex; ETL; bibliometrix; Python,metadata; data pipeline,This paper discusses data standardization challenges in Python bibliometric tools.,8,1,55,70,"Chen L., 2023, Scientometrics Review" +SCOPUS,SCOPUS-ID-003,10.1000/sample3,,A Source-Agnostic ETL Pipeline for Bibliographic Data,International Journal of Information Systems,,2022,Article,English,22,Lee K.; Hasan R.,"Lee, Kim; Hasan, Rakib",University of Malaya; Nanjing University of Information Science and Technology,,Reference M; Reference N; Reference O,ETL; bibliographic data; data transformation,information systems; metadata conversion,The study proposes an ETL pipeline for heterogeneous bibliographic data sources.,15,4,201,220,"Lee K., 2022, International Journal of Information Systems" diff --git a/www/services/bibliometrix_etl/outputs/standardized_openalex_api.csv b/www/services/bibliometrix_etl/outputs/standardized_openalex_api.csv new file mode 100644 index 000000000..a06bc0fd2 --- /dev/null +++ b/www/services/bibliometrix_etl/outputs/standardized_openalex_api.csv @@ -0,0 +1,51 @@ +DB,UT,DI,PMID,TI,SO,JI,PY,DT,LA,TC,AU,AF,C1,RP,CR,DE,ID,AB,VL,IS,BP,EP,SR +OPENALEX,W3160856016,10.1016/j.jbusres.2021.04.070,,How to conduct a bibliometric analysis: An overview and guidelines,Journal of Business Research,,2021,article,en,12082,Naveen Donthu; Satish Kumar; Debmalya Mukherjee; Nitesh Pandey; Weng Marc Lim,Naveen Donthu; Satish Kumar; Debmalya Mukherjee; Nitesh Pandey; Weng Marc Lim,Georgia State University; Malaviya National Institute of Technology Jaipur; Swinburne University of Technology Sarawak Campus; University of Akron; Malaviya National Institute of Technology Jaipur; Swinburne University of Technology; Swinburne University of Technology Sarawak Campus,,,Bibliometrics; Field (mathematics); Data science; Resource (disambiguation); Computer science; Management science; Focus (optics); Library science; Engineering; Mathematics,Bibliometrics; Field (mathematics); Data science; Resource (disambiguation); Computer science; Management science; Focus (optics); Library science; Engineering; Mathematics; Computer network; Physics; Optics; Pure mathematics,,,,,,"Naveen Donthu, 2021, Journal of Business Research" +OPENALEX,W1021000864,10.1007/s11192-015-1645-z,,The bibliometric analysis of scholarly production: How great is the impact?,Scientometrics,,2015,article,en,2987,Ole Ellegaard; Johan Albert Wallin,Ole Ellegaard; Johan Albert Wallin,University of Southern Denmark; University of Southern Denmark,,,Bibliometrics; Production (economics); Knowledge production; Regional science; Citation analysis; Computer science; Sociology; Library science; Knowledge management; Economics; Citation,Bibliometrics; Production (economics); Knowledge production; Regional science; Citation analysis; Computer science; Sociology; Library science; Knowledge management; Economics; Citation; Macroeconomics,"Bibliometric methods or ""analysis"" are now firmly established as scientific specialties and are an integral part of research evaluation methodology especially within the scientific and applied fields. The methods are used increasingly when studying various aspects of science and also in the way institutions and universities are ranked worldwide. A sufficient number of studies have been completed, and with the resulting literature, it is now possible to analyse the bibliometric method by using its own methodology. The bibliometric literature in this study, which was extracted from Web of Science, is divided into two parts using a method comparable to the method of Jonkers et al. (Characteristics of bibliometrics articles in library and information sciences (LIS) and other journals, pp. 449-551, 2012: The publications either lie within the Information and Library Science (ILS) category or within the non-ILS category which includes more applied, ""subject"" based studies. The impact in the different groupings is judged by means of citation analysis using normalized data and an almost linear increase can be observed from 1994 onwards in the non-ILS category. The implication for the dissemination and use of the bibliometric methods in the different contexts is discussed. A keyword analysis identifies the most popular subjects covered by bibliometric analysis, and multidisciplinary articles are shown to have the highest impact. A noticeable shift is observed in those countries which contribute to the pool of bibliometric analysis, as well as a self-perpetuating effect in giving and taking references.",,,,,"Ole Ellegaard, 2015, Scientometrics" +OPENALEX,W1965746216,10.1016/j.ijpe.2015.01.003,,Green supply chain management: A review and bibliometric analysis,International Journal of Production Economics,,2015,review,en,2058,Behnam Fahimnia; Joseph Sarkis; Hoda Davarzani,Behnam Fahimnia; Joseph Sarkis; Hoda Davarzani,The University of Sydney; Worcester Polytechnic Institute; The University of Sydney,,,Field (mathematics); Supply chain management; Identification (biology); Bibliometrics; Computer science; Supply chain; Management science; Data science; Systematic review; Data mining; Business; Engineering; Political science; MEDLINE; Marketing,Field (mathematics); Supply chain management; Identification (biology); Bibliometrics; Computer science; Supply chain; Management science; Data science; Systematic review; Data mining; Business; Engineering; Political science; MEDLINE; Marketing; Law; Mathematics; Biology; Pure mathematics; Botany,,,,,,"Behnam Fahimnia, 2015, International Journal of Production Economics" +OPENALEX,W3001491100,10.3145/epi.2020.ene.03,,Software tools for conducting bibliometric analysis in science: An up-to-date review,El Profesional de la Informacion,,2020,article,es,1587,José A. Moral-Muñoz; Enrique Herrera‐Viedma; Antonio Santisteban‐Espejo; Manuel J. Cobo,José A. Moral-Muñoz; Enrique Herrera‐Viedma; Antonio Santisteban‐Espejo; Manuel J. Cobo,Universidad de Cádiz; Universidad de Granada; Hospital Universitario Puerta del Mar; Universidad de Cádiz,,,Bibliometrics; Visualization; Data science; Computer science; Data visualization; Set (abstract data type); Scientometrics; Database; Data mining; World Wide Web,Bibliometrics; Visualization; Data science; Computer science; Data visualization; Set (abstract data type); Scientometrics; Database; Data mining; World Wide Web; Programming language,"Bibliometrics has become an essential tool for assessing and analyzing the output of scientists, cooperation between universities, the effect of state-owned science funding on national research and development performance and educational efficiency, among other applications. Therefore, professionals and scientists need a range of theoretical and practical tools to measure experimental data. This review aims to provide an up-to-date review of the various tools available for conducting bibliometric and scientometric analyses, including the sources of data acquisition, performance analysis and visualization tools. The included tools were divided into three categories: general bibliometric and performance analysis, science mapping analysis, and libraries; a description of all of them is provided. A comparative analysis of the database sources support, pre-processing capabilities, analysis and visualization options were also provided in order to facilitate its understanding. Although there are numerous bibliometric databases to obtain data for bibliometric and scientometric analysis, they have been developed for a different purpose. The number of exportable records is between 500 and 50,000 and the coverage of the different science fields is unequal in each database. Concerning the analyzed tools, Bibliometrix contains the more extensive set of techniques and suitable for practitioners through Biblioshiny. VOSviewer has a fantastic visualization and is capable of loading and exporting information from many sources. SciMAT is the tool with a powerful pre-processing and export capability. In views of the variability of features, the users need to decide the desired analysis output and chose the option that better fits into their aims.",,,,,"José A. Moral-Muñoz, 2020, El Profesional de la Informacion" +OPENALEX,W3044902155,10.1111/ijcs.12605,,Financial literacy: A systematic review and bibliometric analysis,International Journal of Consumer Studies,,2020,review,en,1071,Kirti Goyal; Satish Kumar,Kirti Goyal; Satish Kumar,Malaviya National Institute of Technology Jaipur; Malaviya National Institute of Technology Jaipur,,,Financial literacy; Citation; Content analysis; Citation analysis; Bibliometrics; Literacy; Financial analysis; Accounting; Political science; Sociology; Social science; Business; Library science; Finance; Computer science; Pedagogy,Financial literacy; Citation; Content analysis; Citation analysis; Bibliometrics; Literacy; Financial analysis; Accounting; Political science; Sociology; Social science; Business; Library science; Finance; Computer science; Pedagogy,"Abstract Given the paucity of comprehensive summaries in the extant literature, this systematic review, coupled with bibliometric analysis, endeavours to take a meticulous approach intended at presenting quantitative and qualitative knowledge on the ever‐emerging subject of financial literacy. The study comprises a review of 502 articles ‐ published in peer‐reviewed journals from 2000 to 2019. Citation network, page‐rank analysis, co‐citation analysis, content analysis and publication trends have been employed to identify influential work, delineate the intellectual structure of the field and identify gaps. The most prominent journals, authors, countries, articles and themes have been identified using bibliometric analysis, followed by a comprehensive analysis of the content of 107 papers in the identified clusters. The three major themes enumerated are—levels of financial literacy amongst distinct cohorts, the influence that financial literacy exerts on financial planning and behaviour, and the impact of financial education. Additionally, content analysis of 175 papers has been conducted for the last four years’ articles that were not covered in the co‐citation analysis. Emerging themes identified include financial capability, financial inclusion, gender gap, tax & insurance literacy, and digital financial education. A conceptual framework has been modelled portraying the complete picture, following which potential areas of research have been suggested. This study will help policy‐makers, regulators and academic researchers know the nuts and bolts of financial literacy, and identify the relevant areas that need investigation.",,,,,"Kirti Goyal, 2020, International Journal of Consumer Studies" +OPENALEX,W4399882939,10.3390/encyclopedia4020065,,Bibliometric Analysis: The Main Steps,Encyclopedia,,2024,article,en,608,Ioannis Passas,Ioannis Passas,Hellenic Mediterranean University,,,Data science; Bibliometrics; Computer science; Field (mathematics); Identification (biology); Citation analysis; Scientific literature; Management science; Information retrieval; Data mining; Citation; Library science; Engineering; Mathematics,Data science; Bibliometrics; Computer science; Field (mathematics); Identification (biology); Citation analysis; Scientific literature; Management science; Information retrieval; Data mining; Citation; Library science; Engineering; Mathematics; Biology; Botany; Paleontology; Pure mathematics,"Bibliometric analysis is a systematic study carried out on scientific literature for the identification of patterns, trends, and impact within a certain field. Major steps include data collection from relevant databases, data cleaning and refining, and subjecting data to various bibliometric methods—an ensuing step in the generation of meaningful information. Bibliometric analysis is an increasingly popular and thorough technique for examining and assessing massive amounts of scientific data, which is being used more and more in research. This entry thoroughly introduces bibliometric methodology, emphasizing its numerous methodologies. It also provides a set of reliable, step-by-step instructions for confidently performing bibliometric analysis. Furthermore, we investigate the suitable use of bibliometric analysis as an alternative to systematic literature reviews. This entry aims to be a useful tool for learning about the methods and approaches that may be used to perform research studies that use bibliometric analysis, particularly in the fields of academic study.",,,,,"Ioannis Passas, 2024, Encyclopedia" +OPENALEX,W1907286193,10.1002/asi.23329,,Growth rates of modern science: A bibliometric analysis based on the number of publications and cited references,Journal of the Association for Information Science and Technology,,2015,article,en,1512,Lutz Bornmann; Rüdiger Mutz,Lutz Bornmann; Rüdiger Mutz,Max Planck Society; Max Planck Innovation; ETH Zurich,,,Bibliometrics; Web of science; Natural science; Computer science; Data science; Library science; Statistics; MEDLINE; Mathematics; Political science; Epistemology; Philosophy,Bibliometrics; Web of science; Natural science; Computer science; Data science; Library science; Statistics; MEDLINE; Mathematics; Political science; Epistemology; Philosophy; Law,"Many studies (in information science) have looked at the growth of science. In this study, we reexamine the question of the growth of science. To do this we (a) use current data up to publication year 2012 and (b) analyze the data across all disciplines and also separately for the natural sciences and for the medical and health sciences. Furthermore, the data were analyzed with an advanced statistical technique—segmented regression analysis—which can identify specific segments with similar growth rates in the history of science. The study is based on two different sets of bibliometric data: (a) the number of publications held as source items in the Web of Science ( WoS , T homson R euters) per publication year and (b) the number of cited references in the publications of the source items per cited reference year. We looked at the rate at which science has grown since the mid‐1600s. In our analysis of cited references we identified three essential growth phases in the development of science, which each led to growth rates tripling in comparison with the previous phase: from less than 1% up to the middle of the 18th century, to 2 to 3% up to the period between the two world wars, and 8 to 9% to 2010.",,,,,"Lutz Bornmann, 2015, Journal of the Association for Information Science and Technology" +OPENALEX,W2563961554,10.1016/j.omega.2016.12.004,,A bibliometric analysis of operations research and management science,Omega,,2016,article,en,721,José M. Merigó; Jianbo Yang,José M. Merigó; Jianbo Yang,University of Manchester; University of Chile; University of Manchester,,,Web of science; Bibliometrics; Field (mathematics); Data science; Computer science; Library science; Management science; Political science; Engineering; MEDLINE; Mathematics,Web of science; Bibliometrics; Field (mathematics); Data science; Computer science; Library science; Management science; Political science; Engineering; MEDLINE; Mathematics; Pure mathematics; Law,,,,,,"José M. Merigó, 2016, Omega" +OPENALEX,W2998021954,10.5530/jscires.8.3.32,,Bibliometric Analysis using Bibliometrix an R Package,Journal of Scientometric Research,,2020,article,en,629,Hamid Derviş,Hamid Derviş,,,,Citation analysis; Bibliometrics; Computer science; Citation; Data science; Field (mathematics); Subject (documents); Analytics; Open source; Software; Web of science; World Wide Web; Political science; MEDLINE; Mathematics,Citation analysis; Bibliometrics; Computer science; Citation; Data science; Field (mathematics); Subject (documents); Analytics; Open source; Software; Web of science; World Wide Web; Political science; MEDLINE; Mathematics; Programming language; Law; Pure mathematics,"This study aims to explore the usage of Open-source software in bibliometric analysis. Biblio-metrix an R package for bibliometric and co-citation analysis was used to achieve the research activities. R is an ecosystem software meaning all functions are shared in an open-source environment with the users. We have used Graphene as a subject of research for bibliometric analysis. Graphene is one of the fastest growing research fields in nanotechnology worldwide. A textual query on Web of Science (WoS) Clarivate Analytics using the term “graphene” was performed retrieving 1155 scholarly papers from 2000 to 2017 with having at least one author based in Turkey. Bibliometric results indicate graphene within nanotechnology as a scientific research field is growing steadily. Graphene not only is used in engineering but also can be used in medical technology. Furthermore, this is an ongoing research exploring an Open-source software and its roles in the field of information studies.",,,,,"Hamid Derviş, 2020, Journal of Scientometric Research" +OPENALEX,W1748004804,10.1016/j.jbusres.2015.10.033,,A bibliometric analysis of social entrepreneurship,Journal of Business Research,,2015,article,en,650,Andrea Rey‐Martí; Domingo Ribeiro Soriano; Daniel Palacios‐Marqués,Andrea Rey‐Martí; Domingo Ribeiro Soriano; Daniel Palacios‐Marqués,Universitat de València; Universitat de València; Universitat Politècnica de València,,,Publication; Entrepreneurship; Boom; Social entrepreneurship; Sociology; Phenomenon; Public relations; Social science; Political science; Business; Advertising; Engineering,Publication; Entrepreneurship; Boom; Social entrepreneurship; Sociology; Phenomenon; Public relations; Social science; Political science; Business; Advertising; Engineering; Law; Environmental engineering; Quantum mechanics; Physics,,,,,,"Andrea Rey‐Martí, 2015, Journal of Business Research" +OPENALEX,W2990450011,10.1016/j.jbusres.2019.10.039,,Forty-five years of Journal of Business Research: A bibliometric analysis,Journal of Business Research,,2019,article,en,923,Naveen Donthu; Satish Kumar; Debidutta Pattnaik,Naveen Donthu; Satish Kumar; Debidutta Pattnaik,Georgia State University; Malaviya National Institute of Technology Jaipur; Malaviya National Institute of Technology Jaipur,,,Publishing; Bibliometrics; Empirical research; Computer science; Library science; Political science,Publishing; Bibliometrics; Empirical research; Computer science; Library science; Political science; Philosophy; Law; Epistemology,,,,,,"Naveen Donthu, 2019, Journal of Business Research" +OPENALEX,W4280610169,10.1016/j.compag.2022.107017,,Drones in agriculture: A review and bibliometric analysis,Computers and Electronics in Agriculture,,2022,review,en,652,Abderahman Rejeb; Alireza Abdollahi; Karim Rejeb; Horst Treiblmaier,Abderahman Rejeb; Alireza Abdollahi; Karim Rejeb; Horst Treiblmaier,University of Rome Tor Vergata; Kharazmi University; University of Carthage; MODUL University Vienna,,,Drone; Bibliometrics; Agriculture; Citation; Data science; Precision agriculture; Profitability index; Computer science; Geography; Business; Library science,Drone; Bibliometrics; Agriculture; Citation; Data science; Precision agriculture; Profitability index; Computer science; Geography; Business; Library science; Archaeology; Genetics; Finance; Biology,"Drones, also called Unmanned Aerial Vehicles (UAV), have witnessed a remarkable development in recent decades. In agriculture, they have changed farming practices by offering farmers substantial cost savings, increased operational efficiency, and better profitability. Over the past decades, the topic of agricultural drones has attracted remarkable academic attention. We therefore conduct a comprehensive review based on bibliometrics to summarize and structure existing academic literature and reveal current research trends and hotspots. We apply bibliometric techniques and analyze the literature surrounding agricultural drones to summarize and assess previous research. Our analysis indicates that remote sensing, precision agriculture, deep learning, machine learning, and the Internet of Things are critical topics related to agricultural drones. The co-citation analysis reveals six broad research clusters in the literature. This study is one of the first attempts to summarize drone research in agriculture and suggest future research directions.",,,,,"Abderahman Rejeb, 2022, Computers and Electronics in Agriculture" +OPENALEX,W2747467399,10.1016/j.ssci.2017.08.011,,Bibliometric analysis of safety culture research,Safety Science,,2017,article,en,593,Karolien van Nunen; Jie Li; Genserik Reniers; Koen Ponnet,Karolien van Nunen; Jie Li; Genserik Reniers; Koen Ponnet,University of Antwerp; Capital University of Economics and Business; Delft University of Technology; Shanghai Maritime University; Delft University of Technology; University of Antwerp; Ghent University; University of Antwerp; Antwerp Maritime Academy,,,Safety culture; Publishing; Multidisciplinary approach; China; Domain (mathematical analysis); Occupational safety and health; Discipline; Sociology; Engineering ethics; Public relations; Social science; Political science; Management; Engineering; Law,Safety culture; Publishing; Multidisciplinary approach; China; Domain (mathematical analysis); Occupational safety and health; Discipline; Sociology; Engineering ethics; Public relations; Social science; Political science; Management; Engineering; Law; Mathematics; Mathematical analysis; Economics,"The concept of safety culture is characterised by complexity. On the one hand, the concept is challenging content-wise, and on the other hand, is it a multi-dimensional and cross-disciplinary research domain. In this paper, bibliometric analysis has been applied to the field of safety culture to identify fundamental influences and to obtain a structured overview of the characteristics and the developments in this research domain. In total, 1789 publications published between 1900 and 2015 related to safety culture were identified in Web of Science. The 1789 publications cover 4591 authors, 775 journals, 76 countries or territories, and 1866 institutions. Two main research areas can be distinguished in the domain of safety culture: (1) organisational safety culture and (2) health-care and patient safety culture. The latter research area stands in a dominant position in safety culture research nowadays. Key publications are from Guldenmund (2000) and Sexton et al. (2006). Furthermore, ‘Safety Science’ is the key journal publishing on safety culture research, and the USA, England and China are the countries that dominate the publication production. It can be concluded that there is much collaborative research in the safety culture domain as multi-authored publications make up about three quarters of all publications. Also, safety culture research is characterised by a wide variety of research themes and multidisciplinarity. Geographical inequality in the publication output is identified as a point of concern. A movement away from technical aspects towards more human aspects could be detected as a noteworthy change in research focus.",,,,,"Karolien van Nunen, 2017, Safety Science" +OPENALEX,W2263682169,10.1016/j.knosys.2014.12.035,,25years at Knowledge-Based Systems: A bibliometric analysis,Knowledge-Based Systems,,2015,article,en,572,Manuel J. Cobo; M. Ángeles Martínez; María Gutiérrez-Salcedo; Hamido Fujita; Enrique Herrera‐Viedma,Manuel J. Cobo; M. Ángeles Martínez; María Gutiérrez-Salcedo; Hamido Fujita; Enrique Herrera‐Viedma,Universidad de Cádiz; Universidad Internacional De La Rioja; Universidad de Jaén; Iwate Prefectural University; Universidad de Granada,,,Computer science; Bibliometrics; Impact factor; Data science; Information retrieval; Library science; Political science,Computer science; Bibliometrics; Impact factor; Data science; Information retrieval; Library science; Political science; Law,,,,,,"Manuel J. Cobo, 2015, Knowledge-Based Systems" +OPENALEX,W2600942248,10.1080/10630732.2017.1285123,,The First Two Decades of Smart-City Research: A Bibliometric Analysis,Journal of Urban Technology,,2017,article,en,667,Luca Mora; Roberto Bolici; Mark Deakin,Luca Mora; Roberto Bolici; Mark Deakin,Politecnico di Milano; Politecnico di Milano; Edinburgh Napier University,,,Bibliometrics; Smart growth; Field (mathematics); Smart city; Data science; Regional science; Cohesion (chemistry); Grey literature; Knowledge management; Political science; Sociology; Computer science; Urban planning; Engineering; Library science; Civil engineering; World Wide Web,Bibliometrics; Smart growth; Field (mathematics); Smart city; Data science; Regional science; Cohesion (chemistry); Grey literature; Knowledge management; Political science; Sociology; Computer science; Urban planning; Engineering; Library science; Civil engineering; World Wide Web; Mathematics; MEDLINE; Internet of Things; Organic chemistry; Chemistry; Pure mathematics; Law,"This paper reports on the first two decades of research on smart cities by conducting a bibliometric analysis of the literature published between 1992 and 2012. The analysis shows that smart-city research is fragmented and lacks cohesion, and its growth follows two main development paths. The first one is based on the peer-reviewed publications produced by European universities, which support a holistic perspective on smart cities. The second path, instead, stands on the gray literature produced by the American business community and relates to a techno-centric understanding of the subject. Divided along such paths, the future development of this new and promising field of research risks being undermined. For while the bibliometric analysis indicates that smart cities are emerging as a fast-growing topic of scientific enquiry, much of the knowledge that is generated about them is singularly technological in nature. In that sense, lacking the social intelligence, cultural artifacts, and environmental attributes, which are needed for the ICT-related urban innovation that such research champions.",,,,,"Luca Mora, 2017, Journal of Urban Technology" +OPENALEX,W3038273726,10.1016/j.jbusres.2020.06.057,,Investigating the emerging COVID-19 research trends in the field of business and management: A bibliometric analysis approach,Journal of Business Research,,2020,article,en,1066,Surabhi Verma; Anders Gustafsson,Surabhi Verma; Anders Gustafsson,University of Southern Denmark; BI Norwegian Business School,,,Coronavirus disease 2019 (COVID-19); Bibliometrics; 2019-20 coronavirus outbreak; Field (mathematics); Severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2); Data science; Regional science; Computer science; Geography; Library science; Medicine; Virology; Mathematics,Coronavirus disease 2019 (COVID-19); Bibliometrics; 2019-20 coronavirus outbreak; Field (mathematics); Severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2); Data science; Regional science; Computer science; Geography; Library science; Medicine; Virology; Mathematics; Disease; Outbreak; Infectious disease (medical specialty); Pathology; Pure mathematics,,,,,,"Surabhi Verma, 2020, Journal of Business Research" +OPENALEX,W2904029666,10.1016/j.engappai.2018.11.007,,Industry 4.0: A bibliometric analysis and detailed overview,Engineering Applications of Artificial Intelligence,,2018,article,en,544,Pranab K. Muhuri; Amit K. Shukla; Ajith Abraham,Pranab K. Muhuri; Amit K. Shukla; Ajith Abraham,South Asian University; South Asian University; Machine Intelligence Research Labs,,,Computer science; Field (mathematics); Bibliometrics; Industrial Revolution; Automation; Data science; Citation; Citation analysis; Subject (documents); Operations research; Engineering management; Library science,Computer science; Field (mathematics); Bibliometrics; Industrial Revolution; Automation; Data science; Citation; Citation analysis; Subject (documents); Operations research; Engineering management; Library science; Pure mathematics; Mechanical engineering; Engineering; Mathematics; Political science; Law,,,,,,"Pranab K. Muhuri, 2018, Engineering Applications of Artificial Intelligence" +OPENALEX,W2783127227,10.3390/su10010166,,A Bibliometric Analysis and Visualization of Medical Big Data Research,Sustainability,,2018,article,en,660,Huchang Liao; Ming Tang; Li Luo; Chunyang Li; Francisco Chiclana; Xiao‐Jun Zeng,Huchang Liao; Ming Tang; Li Luo; Chunyang Li; Francisco Chiclana; Xiao‐Jun Zeng,Sichuan University; Sichuan University; Sichuan University; West China Medical Center of Sichuan University; De Montfort University; University of Manchester,,,Bibliometrics; Visualization; Big data; Science Citation Index; Citation; Data science; Web of science; Index (typography); Citation analysis; Citation index; Information visualization; Computer science; Library science; MEDLINE; World Wide Web; Political science; Data mining,Bibliometrics; Visualization; Big data; Science Citation Index; Citation; Data science; Web of science; Index (typography); Citation analysis; Citation index; Information visualization; Computer science; Library science; MEDLINE; World Wide Web; Political science; Data mining; Law,"With the rapid development of “Internet plus”, medical care has entered the era of big data. However, there is little research on medical big data (MBD) from the perspectives of bibliometrics and visualization. The substantive research on the basic aspects of MBD itself is also rare. This study aims to explore the current status of medical big data through visualization analysis on the journal papers related to MBD. We analyze a total of 988 references which were downloaded from the Science Citation Index Expanded and the Social Science Citation Index databases from Web of Science and the time span was defined as “all years”. The GraphPad Prism 5, VOSviewer and CiteSpace softwares are used for analysis. Many results concerning the annual trends, the top players in terms of journal and institute levels, the citations and H-index in terms of country level, the keywords distribution, the highly cited papers, the co-authorship status and the most influential journals and authors are presented in this paper. This study points out the development status and trends on MBD. It can help people in the medical profession to get comprehensive understanding on the state of the art of MBD. It also has reference values for the research and application of the MBD visualization methods.",,,,,"Huchang Liao, 2018, Sustainability" +OPENALEX,W2885251002,10.1016/j.ijpe.2018.08.003,,Supply chain finance: A systematic literature review and bibliometric analysis,International Journal of Production Economics,,2018,article,en,730,Xinhan Xu; Xiangfeng Chen; Fu Jia; Steve Brown; Yu Gong; Yifan Xu,Xinhan Xu; Xiangfeng Chen; Fu Jia; Steve Brown; Yu Gong; Yifan Xu,Fudan University; Fudan University; University of York; University of Southampton; University of Southampton; Fudan University,,,Trade credit; Supply chain; Mainstream; Payment; Systematic review; Field (mathematics); Service (business); Computer science; Finance; Business; Marketing; Political science,Trade credit; Supply chain; Mainstream; Payment; Systematic review; Field (mathematics); Service (business); Computer science; Finance; Business; Marketing; Political science; Mathematics; Law; MEDLINE; Pure mathematics,,,,,,"Xinhan Xu, 2018, International Journal of Production Economics" +OPENALEX,W2116575643,10.1007/s11192-005-1523-1,,Bibliometric analysis of tsunami research,Scientometrics,,2007,article,en,440,Wen‐Ta Chiu; Yuh‐Shan Ho,Wen‐Ta Chiu; Yuh‐Shan Ho,Wan Fang Hospital; Taipei Medical University; Wan Fang Hospital; Taipei Medical University,,,Subject (documents); Distribution (mathematics); Citation; Science Citation Index; Library science; Bibliometrics; Citation analysis; Statistics; History; Geography; Social science; Computer science; Sociology; Mathematics,Subject (documents); Distribution (mathematics); Citation; Science Citation Index; Library science; Bibliometrics; Citation analysis; Statistics; History; Geography; Social science; Computer science; Sociology; Mathematics; Mathematical analysis,,,,,,"Wen‐Ta Chiu, 2007, Scientometrics" +OPENALEX,W2165022267,10.1177/0007650305278086,,A Bibliometric Analysis of 30 Years of Research and Theory on Corporate Social Responsibility and Corporate Social Performance,Business & Society,,2005,article,en,1079,Frank G. A. de Bakker; Peter Groenewegen; Frank den Hond,Frank G. A. de Bakker; Peter Groenewegen; Frank den Hond,Vrije Universiteit Amsterdam; Vrije Universiteit Amsterdam; Vrije Universiteit Amsterdam,,,Corporate social responsibility; Normative; Vagueness; Sophistication; Sociology; Positive economics; Social responsibility; Process (computing); Stakeholder; Public relations; Social science; Political science; Economics,Corporate social responsibility; Normative; Vagueness; Sophistication; Sociology; Positive economics; Social responsibility; Process (computing); Stakeholder; Public relations; Social science; Political science; Economics; Operating system; Philosophy; Law; Fuzzy logic; Computer science; Linguistics,"Social responsibilities of businesses and their managers have been discussed since the 1950s. Yet no consensus about progress has been achieved in the corporate social responsibility/corporate social performance literature. In this article, we seek to analyze three views on this literature. One view is that development occurred from conceptual vagueness, through clarification of central constructs and their relationships, to the testing of theory—a process supported by increased sophistication in research methods. In contrast, other authors claim that hardly any progress is to be expected because of the inherently normative character of the literature. A final view is that progress in the literature on the social responsibilities of business is obscured or even hampered by the continuing introduction of newconstructs. This article explores which of these three views better describes the evolution of the literature during a period of 30 years and suggests implications for further research.",,,,,"Frank G. A. de Bakker, 2005, Business & Society" +OPENALEX,W3042215340,10.21037/atm-20-4235,,A bibliometric analysis using VOSviewer of publications on COVID-19,Annals of Translational Medicine,,2020,article,en,547,Yuetian Yu; Yujie Li; Zhongheng Zhang; Zhi‐Chun Gu; Han Zhong; Qiongfang Zha; Luyu Yang; Cheng Zhu; Erzhen Chen,Yuetian Yu; Yujie Li; Zhongheng Zhang; Zhi‐Chun Gu; Han Zhong; Qiongfang Zha; Luyu Yang; Cheng Zhu; Erzhen Chen,Shanghai Jiao Tong University; Shanghai Jiao Tong University; Sir Run Run Shaw Hospital; Zhejiang University; Shanghai Jiao Tong University; Shanghai Jiao Tong University; Shanghai Jiao Tong University; Wuhan Third Hospital; Shanghai Jiao Tong University; Shanghai Jiao Tong University,,,Citation; Coronavirus disease 2019 (COVID-19); Web of science; Bibliometrics; Library science; China; Severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2); Pandemic; 2019-20 coronavirus outbreak; Scopus; MEDLINE; Citation analysis; Medicine; History; Political science; Computer science; Meta-analysis; Pathology; Disease,Citation; Coronavirus disease 2019 (COVID-19); Web of science; Bibliometrics; Library science; China; Severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2); Pandemic; 2019-20 coronavirus outbreak; Scopus; MEDLINE; Citation analysis; Medicine; History; Political science; Computer science; Meta-analysis; Pathology; Disease; Archaeology; Outbreak; Law; Infectious disease (medical specialty),"BACKGROUND: As a global pandemic, COVID-19 has aroused great concern in the last few months and a growing number of related researches have been published. Therefore, a bibliometric analysis of these publications may provide a direction of hot topics and future research trends. METHODS: The global literatures about COVID-19 published between 2019 and 2020 were scanned in the Web of Science collection database. ""COVID-19"" ""Novel Coronavirus"" ""2019-nCoV"" and ""SARS-CoV-2"" were used as the keywords to reach the relevant publications. VOSviewer was applied to perform the bibliometric analysis of these articles. RESULTS: Totally 3,626 publications on the topic of COVID-19 were identified and ""COVID-19"" with a total link strength of 2,649 appeared as the most frequent keyword, which had a strong link to ""pneumonia"" and ""epidemiology"". The mean citation count of the top 100 most cited articles was 96 (range, 26-883). Most of them were descriptive studies and concentrated on the clinical features. The highest-ranking journal was British medical journal with 211 publications and the most cited journal was Lancet with 2,485 citation counts. Eleven articles written by Christian Drosten from Berlin Institute of Virology have been cited for 389 times and 40 articles from Chinese Academy of Sciences have been cited for 1,597 times which are the most cited author and organization. The number of collaborators with China is 44 and the total link strength is 487. The main partners of China are USA, England and Germany. The published literatures have focused on three topics: disease management, clinical features and pathogenesis. CONCLUSIONS: The current growth trends predict a large increase in the number of global publications on COVID-19. China made the most outstanding contribution within this important field. Disease treatment, spike protein and vaccine may be hotspots in the future.",,,,,"Yuetian Yu, 2020, Annals of Translational Medicine" +OPENALEX,W3003683721,10.1111/hir.12295,,Application of bibliometrics in medicine: a historical bibliometrics analysis,Health Information & Libraries Journal,,2020,article,en,459,Peter Kokol; Helena Blažun Vošner; Jernej Završnik,Peter Kokol; Helena Blažun Vošner; Jernej Završnik,University of Maribor; Zdravstveni dom dr. Adolfa Drolca Maribor; Šolski center Slovenj Gradec; Zdravstveni dom dr. Adolfa Drolca Maribor,,,Bibliometrics; Scopus; Trend analysis; Data science; MEDLINE; Library science; Computer science; Biology,Bibliometrics; Scopus; Trend analysis; Data science; MEDLINE; Library science; Computer science; Biology; Machine learning; Biochemistry,"BACKGROUND: The application of bibliometrics in medicine enables one to analyse vast amounts of publications and their production patterns on macroscopic and microscopic levels. OBJECTIVES: The aim of the study was to analyse the historical perspective of research literature production regarding application of bibliometrics in medicine. METHODS: Publications related to application of bibliometrics in medicine from 1970 to 2018 were harvested from the Scopus bibliographic database. Reference Publication Year Spectroscopy was triangulated with the VOSViewer to identify historical roots and evolution of topics and clinical areas. RESULTS: The search resulted in 6557 publications. The literature production trend was positive. Historical roots analysis identified 33 historical roots and 16 clinical areas where bibliometrics was applied. DISCUSSION: The increase in productivity in application of bibliometrics in medicine might be attributed to increased use of quantitative metrics in research evaluation, publish or perish phenomenon and the increased use of evidence-based medicine. CONCLUSION: The trend of the literature production was positive. Medicine was in the forefront of knowledge development in bibliometrics. reference publication year spectroscopy proved to be an accurate method which was able to identify most of the historical roots.",,,,,"Peter Kokol, 2020, Health Information & Libraries Journal" +OPENALEX,W2915161772,10.1016/j.frl.2019.02.003,,"A bibliometric analysis on green finance: Current status, development, and future directions",Finance research letters,,2019,article,en,640,Dayong Zhang; Zhiwei Zhang; Shunsuke Managi,Dayong Zhang; Zhiwei Zhang; Shunsuke Managi,Southwestern University of Finance and Economics; Institute of Economics; Institute of Economics; Southwestern University of Finance and Economics; Kyushu University,,,Status quo; Climate Finance; Political science; Regional science; Management science; Economics; Sociology; Economic growth; Developing country,Status quo; Climate Finance; Political science; Regional science; Management science; Economics; Sociology; Economic growth; Developing country; Law,,,,,,"Dayong Zhang, 2019, Finance research letters" +OPENALEX,W2954472560,10.3390/su11133606,,Bibliometric Analysis on Smart Cities Research,Sustainability,,2019,article,en,395,Yiming Guo; Zhen-Ling Huang; Ji Guo; Hua Li; Xingrong Guo; Mpeoane Judith Nkeli,Yiming Guo; Zhen-Ling Huang; Ji Guo; Hua Li; Xingrong Guo; Mpeoane Judith Nkeli,Shanghai Maritime University; Shanghai Maritime University; Shanghai Maritime University; Shanghai Maritime University; Shanghai Maritime University; Shanghai Maritime University,,,Bibliometrics; Work (physics); Smart city; Field (mathematics); Domain (mathematical analysis); Web of science; Data science; Regional science; Computer science; Knowledge management; Engineering; Geography; Political science; Library science; World Wide Web; Internet of Things,Bibliometrics; Work (physics); Smart city; Field (mathematics); Domain (mathematical analysis); Web of science; Data science; Regional science; Computer science; Knowledge management; Engineering; Geography; Political science; Library science; World Wide Web; Internet of Things; Law; Mathematical analysis; Mathematics; Mechanical engineering; Pure mathematics; MEDLINE,"Smart cities have been a global concern in recent years, involving comprehensive scientific research. To obtain a structural overview and assist researchers in making insights into the characteristics of smart cities research, bibliometric analysis was carried out in this paper. With the application of the bibliometric analysis software VOSviewer and CiteSpace, 4409 smart cities were identified by the core collection of the Web of Science in publications between 1998 and 2019 and used in the analysis of this paper. Concretely, this research visually demonstrates a comprehensive overview of the field relating to smart cities in terms of the production of regular publications, main domain of smart cities researchers, most influential countries (institutions, sources and authors), and interesting research directions in the smart city researches. We also present the research collaboration among countries (regions), organizations and authors based on a series of cooperation analyses. The bibliometric analysis of the existing work provided a valuable and seminal reference for researchers and practitioners in smart cities-related research communities.",,,,,"Yiming Guo, 2019, Sustainability" +OPENALEX,W2106572956,10.1016/j.tourman.2010.07.001,,"Publish and perish? Bibliometric analysis, journal ranking and the assessment of research quality in tourism",Tourism Management,,2010,article,en,620,C. Michael Hall,C. Michael Hall,University of Canterbury; Linnaeus University; University of Oulu,,,Bibliometrics; Journal ranking; Scopus; Ranking (information retrieval); Tourism; Quality (philosophy); Context (archaeology); Publish or perish; Citation analysis; Government (linguistics); Impact factor; Publication; Data science; Citation; Regional science; Marketing; Political science; Computer science; Sociology; Business; Library science; Information retrieval; Publishing; Geography; MEDLINE; Advertising,Bibliometrics; Journal ranking; Scopus; Ranking (information retrieval); Tourism; Quality (philosophy); Context (archaeology); Publish or perish; Citation analysis; Government (linguistics); Impact factor; Publication; Data science; Citation; Regional science; Marketing; Political science; Computer science; Sociology; Business; Library science; Information retrieval; Publishing; Geography; MEDLINE; Advertising; Law; Linguistics; Epistemology; Archaeology; Philosophy,,,,,,"C. Michael Hall, 2010, Tourism Management" +OPENALEX,W4320070415,10.1186/s40561-022-00205-x,,Is Metaverse in education a blessing or a curse: a combined content and bibliometric analysis,Smart Learning Environments,,2022,article,en,587,Ahmed Tlili; Ronghuai Huang; Boulus Shehata; Dejian Liu; Jialu Zhao; Ahmed Hosny Saleh Metwally; Huanhuan Wang; Mouna Denden; Aras Bozkurt; Lik‐Hang Lee; Doğuş Beyoğlu; Fahriye Altınay; R. C. Sharma; Zehra Altınay; Zhisheng Li; Jiahao Liu; Faizan Ahmad; Ying Hu; Soheil Salha; Mourad Abed; Daniel Burgos,Ahmed Tlili; Ronghuai Huang; Boulus Shehata; Dejian Liu; Jialu Zhao; Ahmed Hosny Saleh Metwally; Huanhuan Wang; Mouna Denden; Aras Bozkurt; Lik‐Hang Lee; Doğuş Beyoğlu; Fahriye Altınay; R. C. Sharma; Zehra Altınay; Zhisheng Li; Jiahao Liu; Faizan Ahmad; Ying Hu; Soheil Salha; Mourad Abed; Daniel Burgos,"Beijing Normal University; Beijing Normal University; Beijing Normal University; Beijing Normal University; Beijing Normal University; Beijing Normal University; Beijing Normal University; Centre National de la Recherche Scientifique; Institut National des Sciences Appliquées de Rennes; Laboratoire d'Automatique, de Mécanique et d'Informatique Industrielles et Humaines; INSA Hauts-de-France; Université Polytechnique Hauts-de-France; Anadolu University; University of South Africa; Eskişehir City Hospital; Korea Advanced Institute of Science and Technology; Near East University; Near East University; Ambedkar University Delhi; Near East University; Beijing Normal University; Beijing Normal University; COMSATS University Islamabad; Beijing Normal University; Beijing Normal University; An-Najah National University; Centre National de la Recherche Scientifique; Institut National des Sciences Appliquées de Rennes; Laboratoire d'Automatique, de Mécanique et d'Informatique Industrielles et Humaines; INSA Hauts-de-France; Université Polytechnique Hauts-de-France; Universidad Internacional De La Rioja",,,Metaverse; Computer science; Human–computer interaction,Metaverse; Computer science; Human–computer interaction; Virtual reality,"Abstract The Metaverse has been the centre of attraction for educationists for quite some time. This field got renewed interest with the announcement of social media giant Facebook as it rebranding and positioning it as Meta. While several studies conducted literature reviews to summarize the findings related to the Metaverse in general, no study to the best of our knowledge focused on systematically summarizing the finding related to the Metaverse in education. To cover this gap, this study conducts a systematic literature review of the Metaverse in education. It then applies both content and bibliometric analysis to reveal the research trends, focus, and limitations of this research topic. The obtained findings reveal the research gap in lifelogging applications in educational Metaverse. The findings also show that the design of Metaverse in education has evolved over generations, where generation Z is more targeted with artificial intelligence technologies compared to generation X or Y. In terms of learning scenarios, there have been very few studies focusing on mobile learning, hybrid learning, and micro learning. Additionally, no study focused on using the Metaverse in education for students with disabilities. The findings of this study provide a roadmap of future research directions to be taken into consideration and investigated to enhance the adoption of the Metaverse in education worldwide, as well as to enhance the learning and teaching experiences in the Metaverse.",,,,,"Ahmed Tlili, 2022, Smart Learning Environments" +OPENALEX,W2510091332,10.1016/j.compedu.2016.03.010,,Virtual and remote labs in education: A bibliometric analysis,Computers & Education,,2016,article,en,562,Rubén Heradio; Luis de la Torre; Daniel Galán; Francisco Javier Cabrerizo; Enrique Herrera‐Viedma; S. Dormido,Rubén Heradio; Luis de la Torre; Daniel Galán; Francisco Javier Cabrerizo; Enrique Herrera‐Viedma; S. Dormido,Universidad Nacional de Educación a Distancia; Software (Spain); Universidad Nacional de Educación a Distancia; Universidad Nacional de Educación a Distancia; Universidad Nacional de Educación a Distancia; Software (Spain); Universidad de Granada; Universidad Nacional de Educación a Distancia,,,Scopus; Web of science; Computer science; Virtual space; Space (punctuation); World Wide Web; Data science; Multimedia; MEDLINE; Political science; Artificial intelligence,Scopus; Web of science; Computer science; Virtual space; Space (punctuation); World Wide Web; Data science; Multimedia; MEDLINE; Political science; Artificial intelligence; Operating system; Law,,,,,,"Rubén Heradio, 2016, Computers & Education" +OPENALEX,W58954717,,,How to use Bibexcel for various types of bibliometric analysis,Research at the University of Copenhagen (University of Copenhagen),,2009,article,en,624,Olle Persson; Rickard Danell; Jesper Wiborg Schneider,Olle Persson; Rickard Danell; Jesper Wiborg Schneider,Umeå University; Umeå University,,,Computer science,Computer science,"SOCIETY LAWYERS Contact Us Our Locations California Hawaii Alabama Florida Tips you should follow while hiring an experienced attorney When hiring an attorney, you want to make sure they have a track record of success, past and present. Ask your attorney about the cases he has handled and his track record. Some law firms post",,,,,"Olle Persson, 2009, Research at the University of Copenhagen (University of Copenhagen)" +OPENALEX,W3025370095,10.2196/18228,,Artificial Intelligence in Health Care: Bibliometric Analysis,Journal of Medical Internet Research,,2020,article,en,444,Yuqi Guo; Zhichao Hao; Shichong Zhao; Jiaqi Gong; Fan Yang,Yuqi Guo; Zhichao Hao; Shichong Zhao; Jiaqi Gong; Fan Yang,"University of North Carolina at Charlotte; University of Alabama; Dongbei University of Finance and Economics; University of Maryland, Baltimore; Dongbei University of Finance and Economics",,,Health care; Bibliometrics; Artificial intelligence; MEDLINE; Data science; Computer science; Medicine; Data mining; Political science,Health care; Bibliometrics; Artificial intelligence; MEDLINE; Data science; Computer science; Medicine; Data mining; Political science; Law,"BACKGROUND: As a critical driving power to promote health care, the health care-related artificial intelligence (AI) literature is growing rapidly. OBJECTIVE: The purpose of this analysis is to provide a dynamic and longitudinal bibliometric analysis of health care-related AI publications. METHODS: The Web of Science (Clarivate PLC) was searched to retrieve all existing and highly cited AI-related health care research papers published in English up to December 2019. Based on bibliometric indicators, a search strategy was developed to screen the title for eligibility, using the abstract and full text where needed. The growth rate of publications, characteristics of research activities, publication patterns, and research hotspot tendencies were computed using the HistCite software. RESULTS: The search identified 5235 hits, of which 1473 publications were included in the analyses. Publication output increased an average of 17.02% per year since 1995, but the growth rate of research papers significantly increased to 45.15% from 2014 to 2019. The major health problems studied in AI research are cancer, depression, Alzheimer disease, heart failure, and diabetes. Artificial neural networks, support vector machines, and convolutional neural networks have the highest impact on health care. Nucleosides, convolutional neural networks, and tumor markers have remained research hotspots through 2019. CONCLUSIONS: This analysis provides a comprehensive overview of the AI-related research conducted in the field of health care, which helps researchers, policy makers, and practitioners better understand the development of health care-related AI research and possible practice implications. Future AI research should be dedicated to filling in the gaps between AI health care research and clinical applications.",,,,,"Yuqi Guo, 2020, Journal of Medical Internet Research" +OPENALEX,W2886191303,10.1016/j.techfore.2018.07.006,,Knowledge management: A global examination based on bibliometric analysis,Technological Forecasting and Social Change,,2018,article,en,537,Magaly Gaviria-Marín; José M. Merigó; Hugo Baier-Fuentes,Magaly Gaviria-Marín; José M. Merigó; Hugo Baier-Fuentes,Universidad Católica de la Santísima Concepción; Universitat de Barcelona; University of Chile; University of Technology Sydney; Universidad Católica de la Santísima Concepción,,,Field (mathematics); Bibliometrics; Web of science; Computer science; Data science; Knowledge management; Library science; Political science; MEDLINE,Field (mathematics); Bibliometrics; Web of science; Computer science; Data science; Knowledge management; Library science; Political science; MEDLINE; Mathematics; Law; Pure mathematics,,,,,,"Magaly Gaviria-Marín, 2018, Technological Forecasting and Social Change" +OPENALEX,W4283591250,10.1007/s10639-022-11167-5,,Systematic literature review and bibliometric analysis on virtual reality and education,Education and Information Technologies,,2022,article,en,523,Mario Rojas Sánchez; Pedro R. Palos‐Sánchez; José Antonio Folgado-Fernández,Mario Rojas Sánchez; Pedro R. Palos‐Sánchez; José Antonio Folgado-Fernández,Instituto Tecnológico de Costa Rica; University of Beira Interior; Universidad de Sevilla; Universidad de Extremadura,,,Virtual reality; Computer science; Scopus; Subject (documents); Bibliometrics; Instructional simulation; Educational technology; Process (computing); Citation; Scientific literature; Content analysis; Data science; Mathematics education; World Wide Web; Psychology; Social science; Sociology; Human–computer interaction,Virtual reality; Computer science; Scopus; Subject (documents); Bibliometrics; Instructional simulation; Educational technology; Process (computing); Citation; Scientific literature; Content analysis; Data science; Mathematics education; World Wide Web; Psychology; Social science; Sociology; Human–computer interaction; Paleontology; Biology; Operating system; MEDLINE; Political science; Law,"The objective of this study is to identify and analyze the scientific literature with a bibliometric analysis to find the main topics, authors, sources, most cited articles, and countries in the literature on virtual reality in education. Another aim is to understand the conceptual, intellectual, and social structure of the literature on the subject and identify the knowledge base of the use of VR in education and whether it is commonly used and integrated into teaching-learning processes. To do this, articles indexed in the Main Collections of the Web of Science, Scopus and Lens were analyzed for the period 2010 to 2021. The research results are presented in two parts: the first is a quantitative analysis that provides an overview of virtual reality (VR) technology used in the educational field, with tables, graphs, and maps, highlighting the main performance indicators for the production of articles and their citation. The results obtained found a total of 718 articles of which the following were analyzed 273 published articles. The second stage consisted of an inductive type of analysis that found six major groups in the cited articles, which are instruction and learning using VR, VR learning environments, use of VR in different fields of knowledge, learning processes using VR applications or games, learning processes employing simulation, and topics published during the Covid-19 pandemic. Another important aspect to mention is that VR is used in many different areas of education, but until the beginning of the pandemic the use of this so-called ""disruptive process"" came mainly from students, Institutions were reluctant and slow to accept and include VR in the teaching-learning processes.",,,,,"Mario Rojas Sánchez, 2022, Education and Information Technologies" +OPENALEX,W2990688366,10.1016/j.jbusres.2019.11.025,,"A bibliometric analysis of board diversity: Current status, development, and future research directions",Journal of Business Research,,2019,article,en,601,H. Kent Baker; Nitesh Pandey; Satish Kumar; Arunima Haldar,H. Kent Baker; Nitesh Pandey; Satish Kumar; Arunima Haldar,American University; Malaviya National Institute of Technology Jaipur; Malaviya National Institute of Technology Jaipur,,,Diversity (politics); Nationality; Ethnic group; Bibliometrics; Field (mathematics); Gender diversity; Political science; Psychology; Library science; Immigration; Computer science; Corporate governance; Business,Diversity (politics); Nationality; Ethnic group; Bibliometrics; Field (mathematics); Gender diversity; Political science; Psychology; Library science; Immigration; Computer science; Corporate governance; Business; Law; Pure mathematics; Mathematics; Finance,,,,,,"H. Kent Baker, 2019, Journal of Business Research" +OPENALEX,W2592517713,10.1016/j.ibusrev.2017.02.007,,Bibliometric analysis of absorptive capacity,International Business Review,,2017,article,en,351,Indri Dwi Apriliyanti; Ilan Alon,Indri Dwi Apriliyanti; Ilan Alon,Universitas Gadjah Mada; University of Agder; University of Agder,,,Absorptive capacity; Categorization; Citation; Knowledge management; Knowledge transfer; Bibliometrics; Computer science; Data science; Sociology; Library science; Artificial intelligence,Absorptive capacity; Categorization; Citation; Knowledge management; Knowledge transfer; Bibliometrics; Computer science; Data science; Sociology; Library science; Artificial intelligence,,,,,,"Indri Dwi Apriliyanti, 2017, International Business Review" +OPENALEX,W4401785934,10.38124/ijisrt/ijisrt23nov2413,,"A Bibliometric Analysis of Heart Disease Detection using Artificial Intelligence Techniques: Trends, Influential Works, and Research Gaps",International Journal of Innovative Science and Research Technology (IJISRT),,2023,article,en,777,Akshat Kotadia; Bhavy Masalia; Om Mehra; Lakshin Pathak,Akshat Kotadia; Bhavy Masalia; Om Mehra; Lakshin Pathak,,,,Artificial intelligence; Computer science; Data science,Artificial intelligence; Computer science; Data science,"Advanced diagnostic techniques are required as cardiovascular diseases continue to pose a serious threat to global health. The scientific community has recently shown a great deal of interest in the application of deep learning techniques to the detection of heart disease. In order to synthesize the body of research on the use of deep learning in the detection of heart disease, this study provides a thorough bibliometric analysis. A wide variety of publications, including articles, conference papers, and reviews, are included in the analysis. These were obtained from Scopus and WoS databases. Total 662 documents are analyzed from these databases. The study looks at geographic distributions, historical trends, and influential figures in the field. We uncover key papers and authors through quantitative analyses, providing insight into the way research themes have changed over time. The study delves into co-authorship networks and institutional collaborations, offering valuable perspectives on the collaborative environment among scholars operating within this field. To find popular terms and hot topics, keyword analysis is used, which helps to provide a more sophisticated understanding of the main ideas guiding the research that is being done today.",,,,,"Akshat Kotadia, 2023, International Journal of Innovative Science and Research Technology (IJISRT)" +OPENALEX,W4385494672,10.1002/joe.22229,,Guidelines for interpreting the results of bibliometric analysis: A sensemaking approach,Global Business and Organizational Excellence,,2023,article,en,369,Weng Marc Lim; Satish Kumar,Weng Marc Lim; Satish Kumar,Swinburne University of Technology; Sunway University; Swinburne University of Technology Sarawak Campus; Indian Institute of Management Ahmedabad; Sunway University,,,Sensemaking; Interpretation (philosophy); Process (computing); Management science; Computer science; Subjectivity; Data science; Raw data; Epistemology; Knowledge management; Engineering,Sensemaking; Interpretation (philosophy); Process (computing); Management science; Computer science; Subjectivity; Data science; Raw data; Epistemology; Knowledge management; Engineering; Philosophy; Operating system; Programming language,"Abstract While bibliometric analysis is inherently quantitative and objective, it necessitates interpretation, thereby introducing an element of subjectivity. This article proposes a sensemaking approach that transitions researchers from mere description to proactive interpretation of bibliometric results, transforming raw information into informed insights. We discuss the applicability of sensemaking in bibliometric analysis and offer practical guidelines for its integration into systematic literature reviews. These guidelines revolve around a three‐stage sensemaking process—that is, scanning, sensing, and substantiating—each crucial to deriving meaningful interpretations. As such, this article serves as a valuable guide for researchers seeking to utilize bibliometric analysis as a potent analytical tool in their review studies.",,,,,"Weng Marc Lim, 2023, Global Business and Organizational Excellence" +OPENALEX,W2576786802,10.1016/j.jik.2016.12.002,,An overview of qualitative comparative analysis: A bibliometric analysis,Journal of Innovation & Knowledge,,2017,article,en,384,Norat Roig‐Tierno; Tomas F. Gonzalez-Cruz; Jordi Llopis-Martinez,Norat Roig‐Tierno; Tomas F. Gonzalez-Cruz; Jordi Llopis-Martinez,Valencian International University; Universitat de València; Universitat de València,,,Qualitative comparative analysis; Humanities; Qualitative analysis; Qualitative research; Sociology; Mathematics; Philosophy; Social science; Statistics,Qualitative comparative analysis; Humanities; Qualitative analysis; Qualitative research; Sociology; Mathematics; Philosophy; Social science; Statistics,"This study is organized in two parts. We conduct a general analysis of the use of qualitative comparative analysis (QCA), and a bibliometric study of the use of QCA to analyze the specificities of the research publications that apply this methodology. Our results show the differences in quantitative terms of the three variants of this methodology: fsQCA, csQCA, and mvQCA.",,,,,"Norat Roig‐Tierno, 2017, Journal of Innovation & Knowledge" +OPENALEX,W2919854756,10.3390/su11051377,,Tourism Research on Sustainability: A Bibliometric Analysis,Sustainability,,2019,article,en,356,Àngels Niñerola; María Victòria Sánchez Rebull; Ana Beatriz Hernández‐Lara,Àngels Niñerola; María Victòria Sánchez Rebull; Ana Beatriz Hernández‐Lara,Universitat Rovira i Virgili; Universitat Rovira i Virgili; Universitat Rovira i Virgili,,,Scopus; Sustainability; Tourism; Bibliometrics; Destinations; Regional science; Business; Geography; Marketing; Political science; Computer science; Library science; MEDLINE,Scopus; Sustainability; Tourism; Bibliometrics; Destinations; Regional science; Business; Geography; Marketing; Political science; Computer science; Library science; MEDLINE; Archaeology; Biology; Law; Ecology,"Tourism represents one of the main industries in terms of job creation and economic development while sustainability in tourism represents a worldwide challenge. The objective of the present study is to use a bibliometric approach to review the relevant literature. Bibliometric indicators, such as citations, are used to identify the field structure and the VOSviewer software is used to map the main trends in this area. Over the period 1987–2018, a total of 4647 papers were found in Scopus regarding sustainability issues in tourism. Analysis of the leading journals, authors, institutions, and keywords indicates that: (1) the literature on sustainability issues in the field of tourism is significantly growing; (2) a mere six papers accounted more than 300 citations, but there are several prolific authors; (3) of the 614 sources included in the review, the most important have published 46.7% of the papers; (4) in terms of documents and citations, the United States is the leading country in this topic; (5) according to keyword trend network analysis, sustainability is becoming a strategic approach for companies and tourist destinations. Finally, this subfield within the tourism literature has considerable potential and is expected to continue growing.",,,,,"Àngels Niñerola, 2019, Sustainability" +OPENALEX,W2150220236,10.1007/s11192-009-0146-3,,"Software survey: VOSviewer, a computer program for bibliometric mapping",Scientometrics,,2009,article,en,19703,Nees Jan van Eck; Ludo Waltman,Nees Jan van Eck; Ludo Waltman,Leiden University; Erasmus University Rotterdam; Leiden University; Erasmus University Rotterdam,,,Computer science; Construct (python library); Bibliometrics; Citation; Software; Representation (politics); Data science; World Wide Web,Computer science; Construct (python library); Bibliometrics; Citation; Software; Representation (politics); Data science; World Wide Web; Law; Political science; Politics; Programming language,"We present VOSviewer, a freely available computer program that we have developed for constructing and viewing bibliometric maps. Unlike most computer programs that are used for bibliometric mapping, VOSviewer pays special attention to the graphical representation of bibliometric maps. The functionality of VOSviewer is especially useful for displaying large bibliometric maps in an easy-to-interpret way. The paper consists of three parts. In the first part, an overview of VOSviewer's functionality for displaying bibliometric maps is provided. In the second part, the technical implementation of specific parts of the program is discussed. Finally, in the third part, VOSviewer's ability to handle large maps is demonstrated by using the program to construct and display a co-citation map of 5,000 major scientific journals.",,,,,"Nees Jan van Eck, 2009, Scientometrics" +OPENALEX,W2785537869,10.1108/ejm-11-2017-0853,,Fifty years of the European Journal of Marketing: a bibliometric analysis,European Journal of Marketing,,2018,article,en,550,Francisco J. Martínez‐López; José M. Merigó; Leslier Valenzuela‐Fernández; Carolina Nicolás,Francisco J. Martínez‐López; José M. Merigó; Leslier Valenzuela‐Fernández; Carolina Nicolás,Universidad de Granada; EAE Business School; University of Chile; University of Chile; Universidad Santo Tomás,,,Scopus; Originality; Bibliographic coupling; Citation; Bibliometrics; Library science; Productivity; Bibliographic database; European commission; Citation analysis; Impact factor; Regional science; Political science; Social science; Sociology; European union; Computer science; Business; Economics; MEDLINE; Economic growth; Law,Scopus; Originality; Bibliographic coupling; Citation; Bibliometrics; Library science; Productivity; Bibliographic database; European commission; Citation analysis; Impact factor; Regional science; Political science; Social science; Sociology; European union; Computer science; Business; Economics; MEDLINE; Economic growth; Law; Qualitative research; Economic policy,"Purpose The European Journal of Marketing was created in 1967. In 2017, the journal celebrates its 50th anniversary. Therefore, the purpose of this study is to present a bibliometric overview of the leading trends of the journal during this period. Design/methodology/approach This work uses the Scopus database to analyse the most productive authors, institutions and countries, as well as the most cited papers and the citing articles. The investigation uses bibliometric indicators to represent the bibliographic data, including the total number of publications and citations between 1967 and 2017. Additionally, the article also develops a graphical visualization of the bibliographic material by using the visualization of similarities viewer software to map journals, keywords and institutions with bibliographic coupling and co-citation analysis. Findings British authors and institutions are the most productive in the journal, although Australians’ are growing significantly the number of papers published. Continental European institutions are also increasing the number of publications, but they are still far from reaching the British contribution so far. In the mid-term, however, these zone’s authors and institutions, especially those from big European countries like France, Germany, Italy and Spain, should reach a closer performance to British ones; more as less long, historic, but more recent periods of analysis are considered. Practical implications This article is useful for any reader of this journal to understand questions such as papers’ European Journal of Marketing -related scientific productivity in terms of, for instance, contributors/authors, institutions and countries, or the main sources used to back them. Originality/value This is the first comprehensive article offering a general overview of the leading trends and researchers of the journal over its history.",,,,,"Francisco J. Martínez‐López, 2018, European Journal of Marketing" +OPENALEX,W2981634144,10.3791/58494,,"Comparing Bibliometric Analysis Using PubMed, Scopus, and Web of Science Databases",Journal of Visualized Experiments,,2019,article,en,491,Saif Aldeen AlRyalat; Lna Malkawi; Shaher Momani,Saif Aldeen AlRyalat; Lna Malkawi; Shaher Momani,University of Jordan; Yahoo (Spain); University of Jordan; University of Jordan; Northwest African American Museum; King Abdulaziz University,,,Scopus; Web of science; Computer science; Subject (documents); Scope (computer science); Bibliometrics; Information retrieval; Multidisciplinary approach; Database; MEDLINE; Bibliographic database; Protocol (science); World Wide Web; Data science; Medicine; Political science,Scopus; Web of science; Computer science; Subject (documents); Scope (computer science); Bibliometrics; Information retrieval; Multidisciplinary approach; Database; MEDLINE; Bibliographic database; Protocol (science); World Wide Web; Data science; Medicine; Political science; Alternative medicine; Law; Programming language; Pathology,"Literature databases (i.e., PubMed, Scopus, and Web of Science) differ in terms of their coverage, focus, and the tool they provide. PubMed focuses mainly on life sciences and biomedical disciplines, whereas Scopus and Web of Science are multidisciplinary. The protocol described in the current study was used to search for publications from Jordanian authors in the years 2013-2017. In this protocol, how to use each database to conduct this type of search is explained in detail. A Scopus search resulted in the highest number of documents (11,444 documents), followed by a Web of Science search (10,943 documents). PubMed resulted in a smaller number of documents due to its narrower scope and coverage (4,363 documents). The results also show a yearly trend in: (1) the number of publications, (2) the disciplines that have the most publications, (3) the countries of collaboration, and (4) the number of open access publications. In contrast, PubMed has a sophisticated keyword optimization service (i.e., Medical Subject Heading, or MeSH), while both Scopus and Web of Science provide search analysis tools that can produce representative figures. Finally, the features of each database are explained in detail and several indices that can be extracted using the search results are provided. This study provides a base for using literature databases for bibliometric analysis.",,,,,"Saif Aldeen AlRyalat, 2019, Journal of Visualized Experiments" +OPENALEX,W2191867853,10.1016/j.jbusres.2015.10.054,,A bibliometric analysis of international impact of business incubators,Journal of Business Research,,2015,article,en,343,Gema Albort-Morant; Domingo Ribeiro Soriano,Gema Albort-Morant; Domingo Ribeiro Soriano,Universitat de València; Universitat de València,,,Bibliometrics; Productivity; Web of science; Cover (algebra); Regional science; Library science; Business; Political science; Computer science; Sociology; Economics; Engineering; Economic growth; MEDLINE,Bibliometrics; Productivity; Web of science; Cover (algebra); Regional science; Library science; Business; Political science; Computer science; Sociology; Economics; Engineering; Economic growth; MEDLINE; Law; Mechanical engineering,,,,,,"Gema Albort-Morant, 2015, Journal of Business Research" +OPENALEX,W2793000158,10.1016/j.jbusres.2017.12.054,,A bibliometric analysis of born global firms,Journal of Business Research,,2018,article,en,304,Piotr Dzikowski,Piotr Dzikowski,University of Zielona Góra,,,Citation; Citation analysis; Bibliometrics; Productivity; Web of science; Regional science; Library science; Political science; Sociology; Economics; Computer science; Economic growth; MEDLINE; Law,Citation; Citation analysis; Bibliometrics; Productivity; Web of science; Regional science; Library science; Political science; Sociology; Economics; Computer science; Economic growth; MEDLINE; Law,,,,,,"Piotr Dzikowski, 2018, Journal of Business Research" +OPENALEX,W2610818236,10.1016/j.jclepro.2017.05.018,,Corporate social responsibility for supply chain management: A literature review and bibliometric analysis,Journal of Cleaner Production,,2017,review,en,495,Yunting Feng; Qinghua Zhu; Kee‐hung Lai,Yunting Feng; Qinghua Zhu; Kee‐hung Lai,Shanghai Jiao Tong University; Shanghai Jiao Tong University; Hong Kong Polytechnic University,,,Corporate social responsibility; Stakeholder; Normative; Social network analysis; Supply chain; Knowledge management; Supply chain management; Citation analysis; Business; Citation; Field (mathematics); Sociology; Management science; Computer science; Political science; Marketing; Public relations; Engineering; Social science,Corporate social responsibility; Stakeholder; Normative; Social network analysis; Supply chain; Knowledge management; Supply chain management; Citation analysis; Business; Citation; Field (mathematics); Sociology; Management science; Computer science; Political science; Marketing; Public relations; Engineering; Social science; Law; Social capital; Pure mathematics; Mathematics; World Wide Web,,,,,,"Yunting Feng, 2017, Journal of Cleaner Production" +OPENALEX,W2072689080,10.1080/09669582.2014.978790,,Trends and patterns in sustainable tourism research: a 25-year bibliometric analysis,Journal of Sustainable Tourism,,2015,article,en,439,Lisa Ruhanen; Betty Weiler; Brent Moyle; Char-lee McLennan,Lisa Ruhanen; Betty Weiler; Brent Moyle; Char-lee McLennan,University of Queensland; Southern Cross University; Southern Cross University; Griffith University,,,Tourism; Sustainable tourism; Regional science; Bibliometrics; Empirical research; Tourism geography; Sustainable development; Criticism; Sustainability; Social science; Political science; Sociology; Library science; Epistemology,Tourism; Sustainable tourism; Regional science; Bibliometrics; Empirical research; Tourism geography; Sustainable development; Criticism; Sustainability; Social science; Political science; Sociology; Library science; Epistemology; Ecology; Computer science; Biology; Philosophy; Law,"In the quarter of a century since the release of the 1987 Brundtland Report, sustainable tourism has emerged as the dominant paradigm in tourism development. However, the debate, discourse, and criticism of this subfield of tourism research continues. To address such concerns the purpose of this paper is to explore trends and patterns in sustainable tourism research over the past 25 years. A 25-year bibliometric analysis was conducted for the four highest ranked journals in the tourism field. Results indicate that the growth in sustainable tourism research has been remarkable, with 492 papers published in these four journals and almost half of these in the last two years of the analysis. The largest proportion of papers published on sustainable tourism was case studies, empirical studies, and critical reviews. This study found that while the theoretical and methodological approaches appear to have matured over time, the subjects and themes in sustainable tourism research, with some exceptions, have remained constant. However, the field is clearly maturing with a move away from definitional and conceptual papers to papers focused on testing and applying theory through empirical research.",,,,,"Lisa Ruhanen, 2015, Journal of Sustainable Tourism" +OPENALEX,W3125707221,10.1177/1094428114562629,,Bibliometric Methods in Management and Organization,Organizational Research Methods,,2014,article,en,6624,Ivan Župič; Tomaž Čater,Ivan Župič; Tomaž Čater,University of Ljubljana; University of Ljubljana,,,Bibliographic coupling; Citation analysis; Citation; Objectivity (philosophy); Bibliometrics; Workflow; Computer science; Co-citation; Data science; Field (mathematics); Management science; Sociology; Knowledge management; Library science; Epistemology; Database; Engineering,Bibliographic coupling; Citation analysis; Citation; Objectivity (philosophy); Bibliometrics; Workflow; Computer science; Co-citation; Data science; Field (mathematics); Management science; Sociology; Knowledge management; Library science; Epistemology; Database; Engineering; Mathematics; Philosophy; Pure mathematics,"We aim to develop a meaningful single-source reference for management and organization scholars interested in using bibliometric methods for mapping research specialties. Such methods introduce a measure of objectivity into the evaluation of scientific literature and hold the potential to increase rigor and mitigate researcher bias in reviews of scientific literature by aggregating the opinions of multiple scholars working in the field. We introduce the bibliometric methods of citation analysis, co-citation analysis, bibliographical coupling, co-author analysis, and co-word analysis and present a workflow for conducting bibliometric studies with guidelines for researchers. We envision that bibliometric methods will complement meta-analysis and qualitative structured literature reviews as a method for reviewing and evaluating scientific literature. To demonstrate bibliometric methods, we performed a citation and co-citation analysis to map the intellectual structure of the Organizational Research Methods journal.",,,,,"Ivan Župič, 2014, Organizational Research Methods" +OPENALEX,W3198357836,10.1016/j.jbef.2021.100577,,"Artificial intelligence and machine learning in finance: Identifying foundations, themes, and research clusters from bibliometric analysis",Journal of Behavioral and Experimental Finance,,2021,article,en,665,John W. Goodell; Satish Kumar; Weng Marc Lim; Debidutta Pattnaik,John W. Goodell; Satish Kumar; Weng Marc Lim; Debidutta Pattnaik,University of Akron; Malaviya National Institute of Technology Jaipur; Swinburne University of Technology Sarawak Campus; Swinburne University of Technology Sarawak Campus; Woxsen School of Business; Malaviya National Institute of Technology Jaipur,,,Scholarship; Bibliographic coupling; Valuation (finance); Corporate finance; Finance; Citation; Portfolio; Artificial intelligence; Sociology; Economics; Computer science; Library science,Scholarship; Bibliographic coupling; Valuation (finance); Corporate finance; Finance; Citation; Portfolio; Artificial intelligence; Sociology; Economics; Computer science; Library science; Economic growth,,,,,,"John W. Goodell, 2021, Journal of Behavioral and Experimental Finance" +OPENALEX,W1743190515,10.1007/s11192-015-1747-7,,Economics in Latin America: a bibliometric analysis,Scientometrics,,2015,article,en,346,Claudio A. Bonilla; José M. Merigó; Carolina Torres-Abad,Claudio A. Bonilla; José M. Merigó; Carolina Torres-Abad,University of Chile; University of Chile; University of Chile,,,Bibliometrics; Latin Americans; Web of science; Per capita; Regional science; Scientometrics; Scopus; Order (exchange); Library science; Political science; Geography; Economics; Demography; Sociology; MEDLINE; Computer science; Population,Bibliometrics; Latin Americans; Web of science; Per capita; Regional science; Scientometrics; Scopus; Order (exchange); Library science; Political science; Geography; Economics; Demography; Sociology; MEDLINE; Computer science; Population; Law; Finance,,,,,,"Claudio A. Bonilla, 2015, Scientometrics" +OPENALEX,W3183627559,10.1016/j.jbusres.2021.07.015,,Mapping the electronic word-of-mouth (eWOM) research: A systematic review and bibliometric analysis,Journal of Business Research,,2021,review,en,455,Naveen Donthu; Satish Kumar; Neeraj Pandey; Nitesh Pandey; Akanksha Mishra,Naveen Donthu; Satish Kumar; Neeraj Pandey; Nitesh Pandey; Akanksha Mishra,Georgia State University; Swinburne University of Technology Sarawak Campus; Malaviya National Institute of Technology Jaipur; National Institute of Industrial Engineering; Malaviya National Institute of Technology Jaipur; National Institute of Industrial Engineering,,,Word of mouth; Hospitality; Social media; Service (business); Loyalty; Marketing; Field (mathematics); Focus (optics); Tourism; Content analysis; Advertising; Sociology; Business; Psychology; Computer science; Political science; World Wide Web; Social science,Word of mouth; Hospitality; Social media; Service (business); Loyalty; Marketing; Field (mathematics); Focus (optics); Tourism; Content analysis; Advertising; Sociology; Business; Psychology; Computer science; Political science; World Wide Web; Social science; Law; Pure mathematics; Physics; Optics; Mathematics,,,,,,"Naveen Donthu, 2021, Journal of Business Research" +OPENALEX,W2943541748,10.1016/j.cities.2019.04.015,,Neighbourhood walkability: A review and bibliometric analysis,Cities,,2019,review,en,290,Hao Wang; Yuqi Yang,Hao Wang; Yuqi Yang,Central University of Finance and Economics; Central University of Finance and Economics,,,Walkability; Neighbourhood (mathematics); Built environment; Geography; Transport engineering; Environmental planning; Environmental health; Civil engineering; Medicine; Engineering,Walkability; Neighbourhood (mathematics); Built environment; Geography; Transport engineering; Environmental planning; Environmental health; Civil engineering; Medicine; Engineering; Mathematics; Mathematical analysis,,,,,,"Hao Wang, 2019, Cities" diff --git a/www/services/bibliometrix_etl/outputs/standardized_scopus_sample.csv b/www/services/bibliometrix_etl/outputs/standardized_scopus_sample.csv new file mode 100644 index 000000000..8c0277eee --- /dev/null +++ b/www/services/bibliometrix_etl/outputs/standardized_scopus_sample.csv @@ -0,0 +1,4 @@ +DB,UT,DI,PMID,TI,SO,JI,PY,DT,LA,TC,AU,AF,C1,RP,CR,DE,ID,AB,VL,IS,BP,EP,SR +SCOPUS,SCOPUS-ID-001,10.1000/sample1,,Bibliometric Analysis of Artificial Intelligence Research,Journal of Data Science,,2024,Article,English,15,Smith J.; Rahman A.,"Smith, John; Rahman, Ahmed",Nanjing University of Information Science and Technology; University of Dhaka,,Reference A; Reference B; Reference C,bibliometrics; artificial intelligence; research trends,data science; scientometrics,This study analyzes artificial intelligence research using bibliometric methods.,12,2,101,115,"Smith J., 2024, Journal of Data Science" +SCOPUS,SCOPUS-ID-002,10.1000/sample2,,OpenAlex Data Standardization for Bibliometrix Python,Scientometrics Review,,2023,Conference Paper,English,9,Chen L.; Karim M.,"Chen, Li; Karim, Mohammad",Nanjing University of Information Science and Technology,,Reference X; Reference Y,OpenAlex; ETL; bibliometrix; Python,metadata; data pipeline,This paper discusses data standardization challenges in Python bibliometric tools.,8,1,55,70,"Chen L., 2023, Scientometrics Review" +SCOPUS,SCOPUS-ID-003,10.1000/sample3,,A Source-Agnostic ETL Pipeline for Bibliographic Data,International Journal of Information Systems,,2022,Article,English,22,Lee K.; Hasan R.,"Lee, Kim; Hasan, Rakib",University of Malaya; Nanjing University of Information Science and Technology,,Reference M; Reference N; Reference O,ETL; bibliographic data; data transformation,information systems; metadata conversion,The study proposes an ETL pipeline for heterogeneous bibliographic data sources.,15,4,201,220,"Lee K., 2022, International Journal of Information Systems" diff --git a/www/services/bibliometrix_etl/outputs/validation_report_openalex.txt b/www/services/bibliometrix_etl/outputs/validation_report_openalex.txt new file mode 100644 index 000000000..ef9b1ddbd --- /dev/null +++ b/www/services/bibliometrix_etl/outputs/validation_report_openalex.txt @@ -0,0 +1,5 @@ +Bibliometrix ETL Validation Report +================================= + +STATUS: PASSED +No validation errors found. diff --git a/www/services/bibliometrix_etl/outputs/validation_report_scopus.txt b/www/services/bibliometrix_etl/outputs/validation_report_scopus.txt new file mode 100644 index 000000000..ef9b1ddbd --- /dev/null +++ b/www/services/bibliometrix_etl/outputs/validation_report_scopus.txt @@ -0,0 +1,5 @@ +Bibliometrix ETL Validation Report +================================= + +STATUS: PASSED +No validation errors found. diff --git a/www/services/bibliometrix_etl/requirements.txt b/www/services/bibliometrix_etl/requirements.txt new file mode 100644 index 000000000..c43b3199b --- /dev/null +++ b/www/services/bibliometrix_etl/requirements.txt @@ -0,0 +1,3 @@ +pandas +requests +openpyxl \ No newline at end of file diff --git a/www/services/bibliometrix_etl/src/analysis_validation.py b/www/services/bibliometrix_etl/src/analysis_validation.py new file mode 100644 index 000000000..96a08e248 --- /dev/null +++ b/www/services/bibliometrix_etl/src/analysis_validation.py @@ -0,0 +1,164 @@ +""" +Analysis validation module for the Bibliometrix ETL project. + +This file tests whether the standardized WoS-like CSV outputs can be used +for basic bibliometric-style analytical functions. + +It validates both: +1. Base-level output: standardized_scopus_sample.csv +2. Advanced-level output: standardized_openalex_api.csv + +The generated report is saved in: +outputs/analysis_validation_report.txt +""" + +from pathlib import Path +import pandas as pd + + +PROJECT_ROOT = Path(__file__).resolve().parents[1] +OUTPUTS_DIR = PROJECT_ROOT / "outputs" + +SCOPUS_OUTPUT = OUTPUTS_DIR / "standardized_scopus_sample.csv" +OPENALEX_OUTPUT = OUTPUTS_DIR / "standardized_openalex_api.csv" +REPORT_OUTPUT = OUTPUTS_DIR / "analysis_validation_report.txt" + + +def split_semicolon_values(series: pd.Series) -> pd.Series: + """ + Split semicolon-delimited values into separate rows. + + Example: + "AI; bibliometrics; ETL" becomes three separate values. + """ + values = [] + + for item in series.dropna(): + text = str(item).strip() + + if text == "": + continue + + parts = [part.strip() for part in text.split(";") if part.strip()] + values.extend(parts) + + return pd.Series(values) + + +def validate_dataset(df: pd.DataFrame, dataset_name: str) -> str: + """ + Run bibliometric-style validation analyses on a standardized dataset. + """ + report_lines = [] + + report_lines.append("=" * 70) + report_lines.append(f"Analysis Validation for: {dataset_name}") + report_lines.append("=" * 70) + + # Analysis 1: record count + report_lines.append("\n1. Total Records") + report_lines.append(f"Total records: {len(df)}") + + # Analysis 2: publications by year + report_lines.append("\n2. Publications by Year") + if "PY" in df.columns: + year_counts = df["PY"].astype(str).value_counts().sort_index() + report_lines.append(year_counts.to_string()) + else: + report_lines.append("PY column not found.") + + # Analysis 3: top source titles + report_lines.append("\n3. Top Source Titles") + if "SO" in df.columns: + top_sources = df["SO"].replace("", pd.NA).dropna().value_counts().head(10) + if len(top_sources) > 0: + report_lines.append(top_sources.to_string()) + else: + report_lines.append("No source title data available.") + else: + report_lines.append("SO column not found.") + + # Analysis 4: top authors + report_lines.append("\n4. Top Authors") + if "AU" in df.columns: + authors = split_semicolon_values(df["AU"]) + top_authors = authors.value_counts().head(10) + if len(top_authors) > 0: + report_lines.append(top_authors.to_string()) + else: + report_lines.append("No author data available.") + else: + report_lines.append("AU column not found.") + + # Analysis 5: top keywords / index terms + report_lines.append("\n5. Top Keywords or Index Terms") + keyword_column = "DE" if "DE" in df.columns else "ID" + + if keyword_column in df.columns: + keywords = split_semicolon_values(df[keyword_column]) + top_keywords = keywords.value_counts().head(10) + if len(top_keywords) > 0: + report_lines.append(top_keywords.to_string()) + else: + report_lines.append("No keyword data available.") + else: + report_lines.append("DE/ID columns not found.") + + # Analysis 6: citation summary + report_lines.append("\n6. Citation Summary") + if "TC" in df.columns: + citation_series = pd.to_numeric(df["TC"], errors="coerce").fillna(0) + report_lines.append(f"Total citations: {int(citation_series.sum())}") + report_lines.append(f"Average citations: {citation_series.mean():.2f}") + report_lines.append(f"Maximum citations: {int(citation_series.max())}") + else: + report_lines.append("TC column not found.") + + report_lines.append("\nValidation Status: PASSED") + report_lines.append( + "The standardized CSV file can be used for bibliometric-style analysis." + ) + + return "\n".join(report_lines) + + +def main() -> None: + """ + Run analysis validation for all generated standardized outputs. + """ + print("Starting analysis validation...") + + all_reports = [] + + if SCOPUS_OUTPUT.exists(): + scopus_df = pd.read_csv(SCOPUS_OUTPUT) + scopus_report = validate_dataset(scopus_df, "Base Level - Scopus Local File") + all_reports.append(scopus_report) + print("Scopus analysis validation completed.") + else: + all_reports.append(f"Missing file: {SCOPUS_OUTPUT}") + print(f"Missing file: {SCOPUS_OUTPUT}") + + if OPENALEX_OUTPUT.exists(): + openalex_df = pd.read_csv(OPENALEX_OUTPUT) + openalex_report = validate_dataset(openalex_df, "Advanced Level - OpenAlex API") + all_reports.append(openalex_report) + print("OpenAlex analysis validation completed.") + else: + all_reports.append(f"Missing file: {OPENALEX_OUTPUT}") + print(f"Missing file: {OPENALEX_OUTPUT}") + + final_report = "\n\n".join(all_reports) + + with open(REPORT_OUTPUT, "w", encoding="utf-8") as file: + file.write("Bibliometrix ETL Analysis Validation Report\n") + file.write("=" * 70) + file.write("\n\n") + file.write(final_report) + + print(f"Saved analysis validation report: {REPORT_OUTPUT}") + print("ANALYSIS VALIDATION COMPLETED") + + +if __name__ == "__main__": + main() \ No newline at end of file diff --git a/www/services/bibliometrix_etl/src/extractors.py b/www/services/bibliometrix_etl/src/extractors.py new file mode 100644 index 000000000..b8a370ea4 --- /dev/null +++ b/www/services/bibliometrix_etl/src/extractors.py @@ -0,0 +1,273 @@ +""" +Extraction module for the Bibliometrix ETL project. + +This file contains functions for: +1. Reading manually downloaded local files for the base level. +2. Retrieving records from the OpenAlex API for the advanced level. + +The extracted data is returned as Python dictionaries or pandas DataFrames. +""" + +from pathlib import Path +import time +from typing import List, Dict, Any + +import pandas as pd +import requests + +from utils import reconstruct_openalex_abstract + + +def extract_local_file(file_path: str, source: str) -> pd.DataFrame: + """ + Extract bibliographic records from a local file. + + Supported file types: + - CSV for Scopus + - XLSX for Dimensions + - TXT for PubMed-style records + + Parameters + ---------- + file_path: + Path to the input file. + + source: + Name of the source database, such as SCOPUS, DIMENSIONS, or PUBMED. + + Returns + ------- + pandas.DataFrame + Raw extracted data. + """ + path = Path(file_path) + + if not path.exists(): + raise FileNotFoundError(f"File not found: {file_path}") + + extension = path.suffix.lower() + + if extension == ".csv": + return pd.read_csv(path) + + if extension in [".xlsx", ".xls"]: + return pd.read_excel(path) + + if extension == ".txt": + return parse_pubmed_txt(path) + + raise ValueError(f"Unsupported file type: {extension}") + + +def parse_pubmed_txt(file_path: Path) -> pd.DataFrame: + """ + Parse a simple PubMed-style TXT export. + + PubMed text exports often store fields like: + PMID- 123456 + TI - Article title + AU - Author Name + + This parser groups records and converts them into a DataFrame. + """ + records = [] + current_record = {} + + with open(file_path, "r", encoding="utf-8", errors="ignore") as file: + for line in file: + line = line.rstrip("\n") + + if line.strip() == "": + if current_record: + records.append(current_record) + current_record = {} + continue + + if "-" in line[:6]: + tag = line[:4].strip() + value = line[6:].strip() + + if tag in current_record: + if isinstance(current_record[tag], list): + current_record[tag].append(value) + else: + current_record[tag] = [current_record[tag], value] + else: + current_record[tag] = value + + else: + # Continuation line + if current_record: + last_key = list(current_record.keys())[-1] + if isinstance(current_record[last_key], list): + current_record[last_key][-1] += " " + line.strip() + else: + current_record[last_key] += " " + line.strip() + + if current_record: + records.append(current_record) + + return pd.DataFrame(records) + + +def fetch_openalex_records( + query: str, + max_records: int = 100, + per_page: int = 50, + sleep_seconds: float = 1.0 +) -> List[Dict[str, Any]]: + """ + Retrieve bibliographic records from the OpenAlex API. + + This function supports simple pagination and retry behavior. + + Parameters + ---------- + query: + Search query, for example "machine learning". + + max_records: + Maximum number of records to retrieve. + + per_page: + Number of records per page. + + sleep_seconds: + Waiting time between API requests. + + Returns + ------- + list[dict] + List of raw OpenAlex records. + """ + base_url = "https://api.openalex.org/works" + records = [] + page = 1 + + while len(records) < max_records: + params = { + "search": query, + "per-page": per_page, + "page": page + } + + print(f"Fetching OpenAlex page {page}...") + + response = None + + for attempt in range(3): + try: + response = requests.get(base_url, params=params, timeout=30) + + if response.status_code == 200: + break + + print(f"API status {response.status_code}. Retrying...") + time.sleep(sleep_seconds) + + except requests.RequestException as error: + print(f"Request error: {error}. Retrying...") + time.sleep(sleep_seconds) + + if response is None or response.status_code != 200: + print("OpenAlex request failed. Stopping retrieval.") + break + + data = response.json() + page_results = data.get("results", []) + + if not page_results: + break + + records.extend(page_results) + + if len(records) >= max_records: + break + + page += 1 + time.sleep(sleep_seconds) + + return records[:max_records] + + +def normalize_openalex_records(records: List[Dict[str, Any]]) -> pd.DataFrame: + """ + Convert raw OpenAlex JSON records into a flat DataFrame. + + This does not yet convert to WoS schema. + It only flattens useful OpenAlex fields so that the transformer can map them. + """ + rows = [] + + for record in records: + authors = [] + author_full_names = [] + affiliations = [] + + for authorship in record.get("authorships", []): + author = authorship.get("author", {}) + display_name = author.get("display_name", "") + + if display_name: + authors.append(display_name) + author_full_names.append(display_name) + + institutions = authorship.get("institutions", []) + for institution in institutions: + institution_name = institution.get("display_name", "") + if institution_name: + affiliations.append(institution_name) + + source_name = "" + journal_abbreviation = "" + + primary_location = record.get("primary_location") or {} + source = primary_location.get("source") or {} + + if isinstance(source, dict): + source_name = source.get("display_name", "") or "" + journal_abbreviation = source.get("abbreviated_title", "") or "" + + keywords = [] + for keyword in record.get("keywords", []) or []: + if isinstance(keyword, dict) and keyword.get("display_name"): + keywords.append(keyword.get("display_name")) + + concepts = [] + for concept in record.get("concepts", []) or []: + if isinstance(concept, dict) and concept.get("display_name"): + concepts.append(concept.get("display_name")) + + abstract = reconstruct_openalex_abstract(record.get("abstract_inverted_index")) + + row = { + "id": record.get("id", ""), + "doi": record.get("doi", ""), + "display_name": record.get("display_name", ""), + "publication_year": record.get("publication_year", ""), + "cited_by_count": record.get("cited_by_count", 0), + "type": record.get("type", ""), + "language": record.get("language", ""), + "abstract": abstract, + "source": source_name, + "journal_abbreviation": journal_abbreviation, + "authors": authors, + "author_full_names": author_full_names, + "affiliations": affiliations, + "keywords": keywords, + "concepts": concepts + } + + rows.append(row) + + return pd.DataFrame(rows) + + +def extract_openalex(query: str, max_records: int = 100) -> pd.DataFrame: + """ + Complete OpenAlex extraction function. + + It retrieves raw OpenAlex records and normalizes them into a flat DataFrame. + """ + raw_records = fetch_openalex_records(query=query, max_records=max_records) + return normalize_openalex_records(raw_records) \ No newline at end of file diff --git a/www/services/bibliometrix_etl/src/main.py b/www/services/bibliometrix_etl/src/main.py new file mode 100644 index 000000000..eab78f951 --- /dev/null +++ b/www/services/bibliometrix_etl/src/main.py @@ -0,0 +1,249 @@ +""" +Main execution file for the Bibliometrix ETL project. + +This script demonstrates both project levels: + +BASE LEVEL: +- Reads a manually downloaded/local Scopus-like CSV file. +- Converts it into a Web of Science-like standardized format. + +ADVANCED LEVEL: +- Retrieves records from OpenAlex API using a query. +- Converts the API records into the same standardized format. + +Both levels reuse the same transformation and validation pipeline. +""" + +from pathlib import Path +import pandas as pd + +from extractors import extract_local_file, extract_openalex +from transformer import transform_to_wos, save_standardized_csv, prepare_for_csv +from validator import validate_dataframe, save_validation_report, print_validation_result + + +# --------------------------------------------------------- +# Project paths +# --------------------------------------------------------- + +PROJECT_ROOT = Path(__file__).resolve().parents[1] + +DATA_RAW_DIR = PROJECT_ROOT / "data_raw" +OUTPUTS_DIR = PROJECT_ROOT / "outputs" + +DATA_RAW_DIR.mkdir(exist_ok=True) +OUTPUTS_DIR.mkdir(exist_ok=True) + + +# --------------------------------------------------------- +# Base Level Demo Data +# --------------------------------------------------------- + +def create_sample_scopus_file() -> Path: + """ + Create a small Scopus-like CSV file for the base-level demonstration. + + In a real project, this file can be replaced by a manually downloaded + Scopus CSV export. + """ + sample_path = DATA_RAW_DIR / "scopus_sample.csv" + + if sample_path.exists(): + print(f"Sample Scopus file already exists: {sample_path}") + return sample_path + + sample_data = [ + { + "Authors": "Smith J.; Rahman A.", + "Author full names": "Smith, John; Rahman, Ahmed", + "Title": "Bibliometric Analysis of Artificial Intelligence Research", + "Year": 2024, + "Source title": "Journal of Data Science", + "Volume": "12", + "Issue": "2", + "Page start": "101", + "Page end": "115", + "Cited by": 15, + "DOI": "https://doi.org/10.1000/sample1", + "Abstract": "This study analyzes artificial intelligence research using bibliometric methods.", + "Author Keywords": "bibliometrics; artificial intelligence; research trends", + "Index Keywords": "data science; scientometrics", + "Affiliations": "Nanjing University of Information Science and Technology; University of Dhaka", + "References": "Reference A; Reference B; Reference C", + "Document Type": "Article", + "Language of Original Document": "English", + "EID": "SCOPUS-ID-001" + }, + { + "Authors": "Chen L.; Karim M.", + "Author full names": "Chen, Li; Karim, Mohammad", + "Title": "OpenAlex Data Standardization for Bibliometrix Python", + "Year": 2023, + "Source title": "Scientometrics Review", + "Volume": "8", + "Issue": "1", + "Page start": "55", + "Page end": "70", + "Cited by": 9, + "DOI": "doi:10.1000/sample2", + "Abstract": "This paper discusses data standardization challenges in Python bibliometric tools.", + "Author Keywords": "OpenAlex; ETL; bibliometrix; Python", + "Index Keywords": "metadata; data pipeline", + "Affiliations": "Nanjing University of Information Science and Technology", + "References": "Reference X; Reference Y", + "Document Type": "Conference Paper", + "Language of Original Document": "English", + "EID": "SCOPUS-ID-002" + }, + { + "Authors": "Lee K.; Hasan R.", + "Author full names": "Lee, Kim; Hasan, Rakib", + "Title": "A Source-Agnostic ETL Pipeline for Bibliographic Data", + "Year": 2022, + "Source title": "International Journal of Information Systems", + "Volume": "15", + "Issue": "4", + "Page start": "201", + "Page end": "220", + "Cited by": 22, + "DOI": "10.1000/sample3", + "Abstract": "The study proposes an ETL pipeline for heterogeneous bibliographic data sources.", + "Author Keywords": "ETL; bibliographic data; data transformation", + "Index Keywords": "information systems; metadata conversion", + "Affiliations": "University of Malaya; Nanjing University of Information Science and Technology", + "References": "Reference M; Reference N; Reference O", + "Document Type": "Article", + "Language of Original Document": "English", + "EID": "SCOPUS-ID-003" + } + ] + + df = pd.DataFrame(sample_data) + df.to_csv(sample_path, index=False, encoding="utf-8-sig") + + print(f"Created sample Scopus file: {sample_path}") + + return sample_path + + +# --------------------------------------------------------- +# Base Level Pipeline +# --------------------------------------------------------- + +def run_base_level_pipeline() -> None: + """ + Run the base-level ETL pipeline using a local Scopus-like CSV file. + """ + print("\n========================================") + print("BASE LEVEL: Local File ETL") + print("========================================") + + input_file = create_sample_scopus_file() + + raw_df = extract_local_file(str(input_file), source="SCOPUS") + print(f"Extracted local records: {len(raw_df)}") + + standardized_df = transform_to_wos(raw_df, source="SCOPUS") + print("Transformed local records into WoS-like schema.") + + print("\nFirst 5 normalized Scopus rows:") + print(prepare_for_csv(standardized_df).head(5)) + + first_5_path = OUTPUTS_DIR / "scopus_first_5_normalized_rows.csv" + prepare_for_csv(standardized_df).head(5).to_csv( + first_5_path, + index=False, + encoding="utf-8-sig" + ) + print(f"Saved first 5 normalized Scopus rows: {first_5_path}") + + errors = validate_dataframe(standardized_df) + print_validation_result(errors) + + output_csv = OUTPUTS_DIR / "standardized_scopus_sample.csv" + validation_report = OUTPUTS_DIR / "validation_report_scopus.txt" + + save_standardized_csv(standardized_df, str(output_csv)) + save_validation_report(errors, str(validation_report)) + + +# --------------------------------------------------------- +# Advanced Level Pipeline +# --------------------------------------------------------- + +def run_advanced_level_pipeline() -> None: + """ + Run the advanced-level ETL pipeline using OpenAlex API. + """ + print("\n========================================") + print("ADVANCED LEVEL: OpenAlex API ETL") + print("========================================") + + query = "bibliometric analysis" + max_records = 50 + + print(f"OpenAlex query: {query}") + print(f"Maximum records: {max_records}") + + try: + raw_df = extract_openalex(query=query, max_records=max_records) + + if raw_df.empty: + print("No OpenAlex records retrieved. Skipping advanced pipeline.") + return + + print(f"Extracted OpenAlex records: {len(raw_df)}") + + raw_output = OUTPUTS_DIR / "raw_openalex_records.csv" + raw_df.to_csv(raw_output, index=False, encoding="utf-8-sig") + print(f"Saved raw OpenAlex records: {raw_output}") + + standardized_df = transform_to_wos(raw_df, source="OPENALEX") + print("Transformed OpenAlex records into WoS-like schema.") + + print("\nFirst 5 normalized OpenAlex rows:") + print(prepare_for_csv(standardized_df).head(5)) + + first_5_path = OUTPUTS_DIR / "openalex_first_5_normalized_rows.csv" + prepare_for_csv(standardized_df).head(5).to_csv( + first_5_path, + index=False, + encoding="utf-8-sig" + ) + print(f"Saved first 5 normalized OpenAlex rows: {first_5_path}") + + errors = validate_dataframe(standardized_df) + print_validation_result(errors) + + output_csv = OUTPUTS_DIR / "standardized_openalex_api.csv" + validation_report = OUTPUTS_DIR / "validation_report_openalex.txt" + + save_standardized_csv(standardized_df, str(output_csv)) + save_validation_report(errors, str(validation_report)) + + except Exception as error: + print("Advanced OpenAlex pipeline failed.") + print("Error:", error) + + +# --------------------------------------------------------- +# Main +# --------------------------------------------------------- + +def main() -> None: + """ + Execute the complete ETL demonstration. + """ + print("Bibliometrix Python ETL Project Started") + + run_base_level_pipeline() + run_advanced_level_pipeline() + + print("\n========================================") + print("PROJECT EXECUTION COMPLETED") + print("========================================") + print("Check the outputs folder for generated CSV and validation reports.") + + +if __name__ == "__main__": + main() \ No newline at end of file diff --git a/www/services/bibliometrix_etl/src/mappings.py b/www/services/bibliometrix_etl/src/mappings.py new file mode 100644 index 000000000..2efacd4ac --- /dev/null +++ b/www/services/bibliometrix_etl/src/mappings.py @@ -0,0 +1,110 @@ +""" +Mapping dictionaries and target schema for the Bibliometrix ETL project. + +This file contains: +1. The required Web of Science style target columns. +2. Multi-value fields that must behave like lists. +3. Source-specific mappings from raw data fields to WoS field tags. +""" + +# Final standard WoS-like schema required by Bibliometrix-Python +TARGET_COLUMNS = [ + "DB", "UT", "DI", "PMID", "TI", "SO", "JI", "PY", "DT", "LA", "TC", + "AU", "AF", "C1", "RP", "CR", "DE", "ID", "AB", "VL", "IS", "BP", "EP", "SR" +] + +# Fields that contain multiple values +MULTI_VALUE_COLUMNS = ["AU", "AF", "C1", "CR", "DE", "ID"] + +# Fields that should be numeric +INTEGER_COLUMNS = ["TC"] + + +# --------------------------------------------------------- +# Base Level: local file source mappings +# --------------------------------------------------------- + +SCOPUS_MAPPING = { + "Authors": "AU", + "Author full names": "AF", + "Title": "TI", + "Year": "PY", + "Source title": "SO", + "Volume": "VL", + "Issue": "IS", + "Page start": "BP", + "Page end": "EP", + "Cited by": "TC", + "DOI": "DI", + "Abstract": "AB", + "Author Keywords": "DE", + "Index Keywords": "ID", + "Affiliations": "C1", + "References": "CR", + "Document Type": "DT", + "Language of Original Document": "LA", + "EID": "UT" +} + +DIMENSIONS_MAPPING = { + "Title": "TI", + "Authors": "AU", + "Source title": "SO", + "Publication Year": "PY", + "DOI": "DI", + "Abstract": "AB", + "Times cited": "TC", + "Document Type": "DT", + "Volume": "VL", + "Issue": "IS", + "Pagination": "BP", + "Research Categories": "ID", + "MeSH terms": "DE", + "PubMed ID": "PMID", + "Dimensions ID": "UT" +} + +PUBMED_MAPPING = { + "PMID": "PMID", + "TI": "TI", + "AB": "AB", + "AU": "AU", + "FAU": "AF", + "JT": "SO", + "DP": "PY", + "LA": "LA", + "PT": "DT", + "AID": "DI", + "OT": "DE" +} + + +# --------------------------------------------------------- +# Advanced Level: API source mappings +# --------------------------------------------------------- + +OPENALEX_MAPPING = { + "id": "UT", + "doi": "DI", + "display_name": "TI", + "publication_year": "PY", + "cited_by_count": "TC", + "type": "DT", + "language": "LA", + "abstract": "AB", + "source": "SO", + "journal_abbreviation": "JI", + "authors": "AU", + "author_full_names": "AF", + "affiliations": "C1", + "keywords": "DE", + "concepts": "ID" +} + + +SOURCE_MAPPINGS = { + "SCOPUS": SCOPUS_MAPPING, + "DIMENSIONS": DIMENSIONS_MAPPING, + "PUBMED": PUBMED_MAPPING, + "OPENALEX": OPENALEX_MAPPING +} \ No newline at end of file diff --git a/www/services/bibliometrix_etl/src/transformer.py b/www/services/bibliometrix_etl/src/transformer.py new file mode 100644 index 000000000..b3eaf454b --- /dev/null +++ b/www/services/bibliometrix_etl/src/transformer.py @@ -0,0 +1,174 @@ +""" +Transformation module for the Bibliometrix ETL project. + +This module converts heterogeneous bibliographic data into a standardized +Web of Science-like schema required by Bibliometrix-Python. + +It performs: +1. Source-specific column mapping +2. Target column completion +3. Type normalization +4. Null handling +5. Short Reference (SR) generation +6. CSV-safe serialization +""" + +import pandas as pd + +from mappings import TARGET_COLUMNS, MULTI_VALUE_COLUMNS, INTEGER_COLUMNS, SOURCE_MAPPINGS +from utils import ( + clean_scalar, + clean_int, + split_multi_value, + serialize_list, + normalize_doi, + extract_openalex_id, + extract_year, + generate_sr +) + + +def rename_columns_to_wos(raw_df: pd.DataFrame, source: str) -> pd.DataFrame: + """ + Rename source-specific raw columns into WoS-like standard field tags. + + Example: + Title -> TI + Authors -> AU + DOI -> DI + """ + source = source.upper() + + if source not in SOURCE_MAPPINGS: + raise ValueError(f"Unsupported source: {source}") + + mapping = SOURCE_MAPPINGS[source] + + renamed_df = raw_df.rename(columns=mapping) + + return renamed_df + + +def add_missing_target_columns(df: pd.DataFrame) -> pd.DataFrame: + """ + Ensure all required target columns exist. + + If a source does not provide a field, the column is still created. + """ + for column in TARGET_COLUMNS: + if column not in df.columns: + df[column] = "" + + return df + + +def normalize_types(df: pd.DataFrame, source: str) -> pd.DataFrame: + """ + Enforce strong type contracts. + + - Multi-value fields become list[str] + - TC becomes int + - Scalar fields become clean strings + - DOI is normalized + - PY is converted into 4-digit year string + """ + source = source.upper() + + df["DB"] = source + + for column in TARGET_COLUMNS: + if column in MULTI_VALUE_COLUMNS: + df[column] = df[column].apply(split_multi_value) + + elif column in INTEGER_COLUMNS: + df[column] = df[column].apply(clean_int) + + else: + df[column] = df[column].apply(clean_scalar) + + # Special cleaning + df["DI"] = df["DI"].apply(normalize_doi) + df["PY"] = df["PY"].apply(extract_year) + + if source == "OPENALEX": + df["UT"] = df["UT"].apply(extract_openalex_id) + + return df + + +def generate_required_fields(df: pd.DataFrame) -> pd.DataFrame: + """ + Generate calculated fields required by Bibliometrix. + + Currently generates: + - SR: Short Reference + """ + rows = [] + + for _, row in df.iterrows(): + row_dict = row.to_dict() + row_dict["SR"] = generate_sr(row_dict) + rows.append(row_dict) + + return pd.DataFrame(rows) + + +def keep_target_schema_only(df: pd.DataFrame) -> pd.DataFrame: + """ + Keep only the standard target columns in the final order. + """ + return df[TARGET_COLUMNS] + + +def transform_to_wos(raw_df: pd.DataFrame, source: str) -> pd.DataFrame: + """ + Complete transformation pipeline. + + This function transforms raw extracted data into the final standardized + WoS-like schema. + + Parameters + ---------- + raw_df: + Raw DataFrame extracted from local files or API. + + source: + Source name such as SCOPUS, DIMENSIONS, PUBMED, or OPENALEX. + + Returns + ------- + pandas.DataFrame + Standardized DataFrame with target WoS-like columns. + """ + df = rename_columns_to_wos(raw_df, source) + df = add_missing_target_columns(df) + df = normalize_types(df, source) + df = generate_required_fields(df) + df = add_missing_target_columns(df) + df = keep_target_schema_only(df) + + return df + + +def prepare_for_csv(df: pd.DataFrame) -> pd.DataFrame: + """ + Convert list fields into semicolon-delimited strings for CSV export. + + Internally, multi-value fields are list[str]. + For flat CSV export, they are serialized using semicolon (;). + """ + csv_df = df.copy() + + for column in MULTI_VALUE_COLUMNS: + csv_df[column] = csv_df[column].apply(serialize_list) + + return csv_df + + +def save_standardized_csv(df: pd.DataFrame, output_path: str) -> None: + """ + Save standardized DataFrame into a CSV file. + """ + csv_df = prepare_for_csv(df) + csv_df.to_csv(output_path, index=False, encoding="utf-8-sig") + print(f"Saved standardized CSV: {output_path}") \ No newline at end of file diff --git a/www/services/bibliometrix_etl/src/utils.py b/www/services/bibliometrix_etl/src/utils.py new file mode 100644 index 000000000..458d1b55c --- /dev/null +++ b/www/services/bibliometrix_etl/src/utils.py @@ -0,0 +1,202 @@ +""" +Utility functions for the Bibliometrix ETL project. + +These helper functions are used by the extraction and transformation modules. +They clean missing values, split multi-value fields, normalize DOI values, +reconstruct OpenAlex abstracts, and generate short references. +""" + +import math +import re +from typing import Any, List + + +def is_missing(value: Any) -> bool: + """ + Check whether a value is missing. + + Handles None, NaN, and empty strings. + """ + if value is None: + return True + + if isinstance(value, float) and math.isnan(value): + return True + + if isinstance(value, str) and value.strip() == "": + return True + + return False + + +def clean_scalar(value: Any) -> str: + """ + Convert a scalar value into a clean string. + + Missing values are converted to an empty string. + """ + if is_missing(value): + return "" + + return str(value).strip() + + +def clean_int(value: Any) -> int: + """ + Convert a value into an integer. + + Missing or invalid values are converted to 0. + """ + if is_missing(value): + return 0 + + try: + return int(float(value)) + except Exception: + return 0 + + +def normalize_doi(value: Any) -> str: + """ + Normalize DOI values. + + Examples: + - https://doi.org/10.1234/example -> 10.1234/example + - doi:10.1234/example -> 10.1234/example + """ + doi = clean_scalar(value) + + if doi == "": + return "" + + doi = doi.replace("https://doi.org/", "") + doi = doi.replace("http://doi.org/", "") + doi = doi.replace("doi:", "") + doi = doi.replace("DOI:", "") + + return doi.strip() + + +def split_multi_value(value: Any) -> List[str]: + """ + Convert a raw multi-value field into a list of strings. + + Bibliometrix fields such as AU, AF, C1, CR, DE, and ID should behave + like list[str] inside the pipeline. + + For CSV export, these lists will later be serialized using semicolon (;). + """ + if is_missing(value): + return [] + + if isinstance(value, list): + return [str(v).strip() for v in value if not is_missing(v)] + + text = str(value).strip() + + if text == "": + return [] + + # Common bibliographic delimiters + delimiters = [";", "|", "\n"] + + for delimiter in delimiters: + if delimiter in text: + return [item.strip() for item in text.split(delimiter) if item.strip()] + + # If no delimiter exists, return one-item list + return [text] + + +def serialize_list(value: Any) -> str: + """ + Convert list values into semicolon-delimited strings for CSV output. + """ + if is_missing(value): + return "" + + if isinstance(value, list): + return "; ".join([str(v).strip() for v in value if str(v).strip()]) + + return str(value).strip() + + +def reconstruct_openalex_abstract(inverted_index: Any) -> str: + """ + Reconstruct an OpenAlex abstract from abstract_inverted_index. + + OpenAlex stores abstracts as: + { + "word": [position1, position2] + } + + This function converts that structure into normal text. + """ + if not isinstance(inverted_index, dict): + return "" + + position_to_word = {} + + for word, positions in inverted_index.items(): + if isinstance(positions, list): + for position in positions: + position_to_word[position] = word + + words = [position_to_word[i] for i in sorted(position_to_word.keys())] + + return " ".join(words) + + +def extract_openalex_id(value: Any) -> str: + """ + Extract only the OpenAlex work ID from a full OpenAlex URL. + + Example: + https://openalex.org/W123456789 -> W123456789 + """ + text = clean_scalar(value) + + if text == "": + return "" + + return text.rstrip("/").split("/")[-1] + + +def extract_year(value: Any) -> str: + """ + Extract a 4-digit publication year from a value. + """ + text = clean_scalar(value) + + match = re.search(r"\b(19|20)\d{2}\b", text) + + if match: + return match.group(0) + + return "" + + +def generate_sr(row: dict) -> str: + """ + Generate a short reference field. + + SR usually combines: + First Author + Publication Year + Source Title + + Example: + Smith, 2024, Nature + """ + authors = row.get("AU", []) + year = clean_scalar(row.get("PY", "")) + source = clean_scalar(row.get("SO", "")) + + first_author = "" + + if isinstance(authors, list) and len(authors) > 0: + first_author = clean_scalar(authors[0]) + else: + first_author = clean_scalar(authors) + + parts = [part for part in [first_author, year, source] if part != ""] + + return ", ".join(parts) \ No newline at end of file diff --git a/www/services/bibliometrix_etl/src/validator.py b/www/services/bibliometrix_etl/src/validator.py new file mode 100644 index 000000000..bb3fdd55a --- /dev/null +++ b/www/services/bibliometrix_etl/src/validator.py @@ -0,0 +1,111 @@ +""" +Validation module for the Bibliometrix ETL project. + +This module checks whether the transformed DataFrame follows the required +WoS-like schema expected by Bibliometrix-Python. +""" + +from typing import List +import pandas as pd + +from mappings import TARGET_COLUMNS, MULTI_VALUE_COLUMNS + + +def validate_required_columns(df: pd.DataFrame) -> List[str]: + """ + Check whether all required target columns exist. + """ + errors = [] + + for column in TARGET_COLUMNS: + if column not in df.columns: + errors.append(f"Missing required column: {column}") + + return errors + + +def validate_no_null_values(df: pd.DataFrame) -> List[str]: + """ + Check whether the final DataFrame contains NaN/None values. + """ + errors = [] + + null_counts = df.isnull().sum() + + for column, count in null_counts.items(): + if count > 0: + errors.append(f"Column {column} contains {count} null values") + + return errors + + +def validate_multi_value_columns(df: pd.DataFrame) -> List[str]: + """ + Check whether multi-value fields are lists before CSV serialization. + """ + errors = [] + + for column in MULTI_VALUE_COLUMNS: + if column not in df.columns: + continue + + invalid_count = 0 + + for value in df[column]: + if not isinstance(value, list): + invalid_count += 1 + + if invalid_count > 0: + errors.append( + f"Column {column} has {invalid_count} non-list values" + ) + + return errors + + +def validate_dataframe(df: pd.DataFrame) -> List[str]: + """ + Run all validation checks. + """ + errors = [] + + errors.extend(validate_required_columns(df)) + errors.extend(validate_no_null_values(df)) + errors.extend(validate_multi_value_columns(df)) + + return errors + + +def save_validation_report(errors: List[str], output_path: str) -> None: + """ + Save validation results into a text file. + """ + with open(output_path, "w", encoding="utf-8") as file: + file.write("Bibliometrix ETL Validation Report\n") + file.write("=================================\n\n") + + if not errors: + file.write("STATUS: PASSED\n") + file.write("No validation errors found.\n") + else: + file.write("STATUS: FAILED\n") + file.write("Validation errors:\n\n") + + for error in errors: + file.write(f"- {error}\n") + + print(f"Saved validation report: {output_path}") + + +def print_validation_result(errors: List[str]) -> None: + """ + Print validation result in terminal. + """ + print("\n========== VALIDATION RESULT ==========") + + if not errors: + print("PASSED: Standardized data is valid.") + else: + print("FAILED: Validation errors found.") + for error in errors: + print("-", error) \ No newline at end of file