diff --git a/.DS_Store b/.DS_Store
new file mode 100644
index 000000000..ac04fb02c
Binary files /dev/null and b/.DS_Store differ
diff --git a/.gitignore b/.gitignore
index 23b99e089..eda5fea88 100644
--- a/.gitignore
+++ b/.gitignore
@@ -1,4 +1,11 @@
 __pycache__/
 bibliovenv/
 Bibenv/
-.idea/
\ No newline at end of file
+.idea/.DS_Store
+*.bak
+all_code.txt
+venv/
+__pycache__/
+*.pyc
+*.rda
+*.rdata
diff --git a/analysis.py b/analysis.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/app.py b/app.py
index f0891f894..ef94f8a63 100644
--- a/app.py
+++ b/app.py
@@ -667,7 +667,8 @@ def select_db():
                                     "dimensions": "Dimensions",
                                     "lens": "Lens.org",
                                     "pubmed": "PubMed",
-                                    "cochrane": "Cochrane Library"
+                                    "cochrane": "Cochrane Library",
+                                    "openalex": "OpenAlex"
                                 },
                             )
                             ui.input_select(
@@ -868,7 +869,7 @@ def indicator_types_ui_all():
 
             @reactive.calc
             def filters():
-                return get_filters(df)
+                return get_filters(df.get())
             
             with ui.layout_sidebar(fillable=False, fill=False):
                 # Sidebar for data import options
@@ -886,9 +887,9 @@ def show_filter():
                             "Select Year Range", 
                             sep="", 
                             ticks=True, 
-                            min=data["Min_Year"][0], 
-                            max=data["Max_Year"][0], 
-                            value=(data["Min_Year"][0], data["Max_Year"][0]), 
+                            min=data["Min_Year"].iloc[0], 
+                            max=data["Max_Year"].iloc[0], 
+                            value=(data["Min_Year"].iloc[0], data["Max_Year"].iloc[0]), 
                             step=1, 
                             time_format="YYYY"
                         )
@@ -988,7 +989,7 @@ def show_main_information_report():
                             "Average citations per doc"
                         ],
                         "Value": [
-                            f"{data['Min_Year'][0]} - {data['Max_Year'][0]}",
+                            f"{data['Min_Year'].iloc[0]} - {data['Max_Year'].iloc[0]}",
                             data['SO'].nunique(),
                             len(data),
                             data['CAGR'][0],
@@ -1060,7 +1061,7 @@ def loading_modal():
                     return ui.HTML(str(modal) + js)
                 ui.modal_show(loading_modal())
                 try:
-                    result = get_main_informations(df)
+                    result = get_main_informations(df.get())
                     return result
                 finally:
                     ui.modal_remove()
@@ -1077,7 +1078,7 @@ def show_informations():
                                 with ui.value_box(showcase=ICONS["timespan"], theme="bg-gradient-blue-purple"):
                                     "Timespan"
                                     ui.h2(
-                                        f"{data['Min_Year'][0]} - {data['Max_Year'][0]}"
+                                        f"{data['Min_Year'].iloc[0]} - {data['Max_Year'].iloc[0]}"
                                     )
                                 with ui.value_box(showcase=ICONS["sources"], theme="bg-gradient-blue-purple"):
                                     "Sources"
@@ -1160,7 +1161,7 @@ def table_informations():
                                         "Average citations per doc"
                                     ],
                                     "Value": [
-                                        f"{data['Min_Year'][0]} - {data['Max_Year'][0]}",
+                                        f"{data['Min_Year'].iloc[0]} - {data['Max_Year'].iloc[0]}",
                                         data['SO'].nunique(),
                                         len(data),
                                         data['CAGR'][0],
@@ -1174,7 +1175,7 @@ def table_informations():
                                         data['Average_Citations_per_Doc'][0]
                                     ]
                                 })
-                                return ui.HTML(DT(df_box, style="width=100%;"))
+                                return ui.HTML(DT(df_box, style="width:100%;"))
         
         # --- Annual Scientific Production Section ---
         with ui.nav_panel("None", value="annual_scientific_production"):
@@ -1215,7 +1216,7 @@ def show_annual_production_report():
             with ui.card(full_screen=True):
                 @reactive.calc
                 def annual_informations():
-                    return get_annual_production(df)
+                    return get_annual_production(df.get())
 
                 with ui.navset_underline(id="annual_tab"):
                     with ui.nav_panel("Plot"):
@@ -1228,7 +1229,7 @@ def show_annual_production():
                         @render.ui
                         def table_annual_production():
                             _, publications_per_year = annual_informations()
-                            return ui.HTML(DT(publications_per_year, style="width=100%;"))
+                            return ui.HTML(DT(publications_per_year, style="width:100%;"))
 
             # AI bot Gemini Chat Integration
             # --- Floating Chat Button ---
@@ -1369,7 +1370,7 @@ def show_average_citations_report():
             with ui.card(full_screen=True):
                 @reactive.calc
                 def average_citations():
-                    return get_average_citations(df)
+                    return get_average_citations(df.get())
 
                 with ui.navset_underline(id="average_tab"):
                     with ui.nav_panel("Plot"):
@@ -1382,7 +1383,7 @@ def show_average_citations():
                         @render.ui
                         def table_average_citations():
                             _, avg_citations = average_citations()
-                            return ui.HTML(DT(avg_citations, style="width=100%;"))
+                            return ui.HTML(DT(avg_citations, style="width:100%;"))
         
         # --- Three-Field Plot Section ---
         with ui.nav_panel("None", value="three_field_plot"):
@@ -1467,7 +1468,7 @@ def calculate_three_field_plot():
                             middle_field_items = input.middle_field_items()
                             right_field_items = input.right_field_items()
 
-                            result = get_three_field_plot(df, left_field, middle_field, right_field, left_field_items, middle_field_items, right_field_items)
+                            result = get_three_field_plot(df.get(), left_field, middle_field, right_field, left_field_items, middle_field_items, right_field_items)
                             three_field_plot_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -1601,7 +1602,7 @@ def loading_modal():
                         ui.modal_show(loading_modal())
                         try:
                             num_of_sources = input.num_of_sources()
-                            result = get_relevant_sources(df, num_of_sources)
+                            result = get_relevant_sources(df.get(), num_of_sources)
                             relevant_sources_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -1636,7 +1637,7 @@ def table_relevant_sources():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, relevant_sources_tab = result
-                                return ui.HTML(DT(relevant_sources_tab, style="width=100%;"))
+                                return ui.HTML(DT(relevant_sources_tab, style="width:100%;"))
         
         # --- Most Local Cited Sources Section ---
         with ui.nav_panel("None", value="most_local_cited_sources"):
@@ -1745,7 +1746,7 @@ def loading_modal():
                         ui.modal_show(loading_modal())
                         try:
                             num_of_cited_sources = input.num_of_cited_sources()
-                            result = get_local_cited_sources(df, num_of_cited_sources)
+                            result = get_local_cited_sources(df.get(), num_of_cited_sources)
                             local_cited_sources_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -1780,7 +1781,7 @@ def table_local_cited_sources():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, local_cited_sources_tab = result
-                                return ui.HTML(DT(local_cited_sources_tab, style="width=100%;"))
+                                return ui.HTML(DT(local_cited_sources_tab, style="width:100%;"))
         
         # --- Bradford's Law Section ---
         with ui.nav_panel("None", value="bradfords_law"):
@@ -1821,7 +1822,7 @@ def show_bradfords_law_report():
             with ui.card(full_screen=True):
                 @reactive.calc
                 def bradford_law():
-                    return get_bradford_law(df)
+                    return get_bradford_law(df.get())
 
                 with ui.navset_underline(id="bradford_law_tab"):
                     with ui.nav_panel("Plot"):
@@ -1834,7 +1835,7 @@ def show_bradford_law():
                         @render.ui
                         def table_bradford_law():
                             _, bradford_law_tab = bradford_law()
-                            return ui.HTML(DT(bradford_law_tab, style="width=100%;"))
+                            return ui.HTML(DT(bradford_law_tab, style="width:100%;"))
         
         # --- Sources' Local Impact Section ---
         with ui.nav_panel("None", value="sources_local_impact"):
@@ -1945,7 +1946,7 @@ def loading_modal():
                         try:
                             num_of_sources_local_impact = input.num_of_sources_local_impact()
                             source_local_impact = input.source_local_impact()
-                            result = get_sources_local_impact(df, num_of_sources_local_impact, source_local_impact)
+                            result = get_sources_local_impact(df.get(), num_of_sources_local_impact, source_local_impact)
                             sources_local_impact_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -1980,7 +1981,7 @@ def table_sources_local_impact():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, sources_local_impact_tab = result
-                                return ui.HTML(DT(sources_local_impact_tab, style="width=100%;"))
+                                return ui.HTML(DT(sources_local_impact_tab, style="width:100%;"))
         
         # --- Sources' Production ---
         with ui.nav_panel("None", value="sources_production"):
@@ -2080,7 +2081,7 @@ def loading_modal():
                 try:
                     num_of_sources_production = input.num_of_sources_production()
                     occurences = input.occurences()
-                    result = get_sources_production(df, num_of_sources_production, occurences)
+                    result = get_sources_production(df.get(), num_of_sources_production, occurences)
                     sources_production_result.set(result)
                 finally:
                     ui.modal_remove()
@@ -2126,7 +2127,7 @@ def table_sources_production():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, sources_production_tab = result
-                                return ui.HTML(DT(sources_production_tab, style="width=100%;"))
+                                return ui.HTML(DT(sources_production_tab, style="width:100%;"))
         
         # --- Most Relevant Authors Section ---
         with ui.nav_panel("None", value="most_relevant_authors"):
@@ -2227,7 +2228,7 @@ def loading_modal():
                 try:
                     num_of_authors = input.num_of_authors()
                     frequency = input.frequency()
-                    result = get_relevant_authors(df, num_of_authors, frequency)
+                    result = get_relevant_authors(df.get(), num_of_authors, frequency)
                     relevant_authors_result.set(result)
                 finally:
                     ui.modal_remove()
@@ -2273,7 +2274,7 @@ def table_relevant_authors():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, relevant_authors_tab = result
-                                return ui.HTML(DT(relevant_authors_tab, style="width=100%;"))
+                                return ui.HTML(DT(relevant_authors_tab, style="width:100%;"))
         
         # --- Most Local Cited Authors Section ---
         with ui.nav_panel("None", value="most_local_cited_authors"):
@@ -2376,7 +2377,7 @@ def loading_modal():
                 ui.modal_show(loading_modal())
                 try:
                     num_of_cited_authors = input.num_of_cited_authors()
-                    result = get_local_cited_authors(df, num_of_cited_authors)
+                    result = get_local_cited_authors(df.get(), num_of_cited_authors)
                     local_cited_authors_result.set(result)
                 finally:
                     ui.modal_remove()
@@ -2421,7 +2422,7 @@ def table_local_cited_authors():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, local_cited_authors_tab = result
-                                return ui.HTML(DT(local_cited_authors_tab, style="width=100%;"))
+                                return ui.HTML(DT(local_cited_authors_tab, style="width:100%;"))
         
         # --- Authors' Production over Time Section ---
         with ui.nav_panel("None", value="authors_production"):
@@ -2521,7 +2522,7 @@ def loading_modal():
                 ui.modal_show(loading_modal())
                 try:
                     top_k_authors = input.TopAuthorsProdK()
-                    result = get_author_production_over_time(df, top_k_authors)
+                    result = get_author_production_over_time(df.get(), top_k_authors)
                     au_over_time_result.set(result)
                 finally:
                     ui.modal_remove()
@@ -2566,7 +2567,7 @@ def table_authors_production():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, table_authors_production, _ = result
-                                return ui.HTML(DT(table_authors_production, style="width=100%;"))
+                                return ui.HTML(DT(table_authors_production, style="width:100%;"))
 
                         with ui.nav_panel("Table - Documents"):
                             @render.ui
@@ -2584,7 +2585,7 @@ def table_documents():
                                     table_documents['DOI'] = table_documents['DOI'].apply(
                                         lambda x: f'<a href="https://doi.org/{x}" target="_blank">{x}</a>' if x != "N/A" else x
                                     )
-                                return ui.HTML(DT(table_documents, style="width=100%;"))
+                                return ui.HTML(DT(table_documents, style="width:100%;"))
                     # AI bot Gemini Chat Integration
             # --- Floating Chat Button ---
             @render.express()
@@ -2723,7 +2724,7 @@ def show_lotkas_law_report():
             with ui.card(full_screen=True):
                 @reactive.calc
                 def lotka_law():
-                    return get_lotka_law(df)
+                    return get_lotka_law(df.get())
 
                 with ui.navset_underline(id="lotka_law_tab"):
                     with ui.nav_panel("Plot"):
@@ -2736,7 +2737,7 @@ def show_lotka_law():
                         @render.ui
                         def table_lotka_law():
                             _, lotka_law_tab = lotka_law()
-                            return ui.HTML(DT(lotka_law_tab, style="width=100%;"))
+                            return ui.HTML(DT(lotka_law_tab, style="width:100%;"))
         
         # --- Authors' Local Impact Section ---
         with ui.nav_panel("None", value="authors_local_impact"):
@@ -2837,7 +2838,7 @@ def loading_modal():
                 try:
                     num_of_authors_local_impact = input.num_of_authors_local_impact()
                     author_local_impact = input.author_local_impact()
-                    result = get_authors_local_impact(df, num_of_authors_local_impact, author_local_impact)
+                    result = get_authors_local_impact(df.get(), num_of_authors_local_impact, author_local_impact)
                     authors_local_impact_result.set(result)
                 finally:
                     ui.modal_remove()
@@ -2883,7 +2884,7 @@ def table_authors_local_impact():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, authors_local_impact_tab = result
-                                return ui.HTML(DT(authors_local_impact_tab, style="width=100%;"))
+                                return ui.HTML(DT(authors_local_impact_tab, style="width:100%;"))
         
         # --- Most Relevant Affiliations Section ---
         with ui.nav_panel("None", value="most_relevant_affiliations"):
@@ -2984,7 +2985,7 @@ def loading_modal():
                 try:
                     num_of_affiliations = input.num_of_affiliations()
                     disambiguation = input.disambiguation()
-                    result = get_relevant_affiliations(df, num_of_affiliations, disambiguation)
+                    result = get_relevant_affiliations(df.get(), num_of_affiliations, disambiguation)
                     relevant_affiliations_result.set(result)
                 finally:
                     ui.modal_remove()
@@ -3030,7 +3031,7 @@ def table_relevant_affiliations():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, relevant_affiliations_tab = result
-                                return ui.HTML(DT(relevant_affiliations_tab, style="width=100%;"))
+                                return ui.HTML(DT(relevant_affiliations_tab, style="width:100%;"))
         
         # --- Affiliations' Production over Time Section ---
         with ui.nav_panel("None", value="affiliations_production"):
@@ -3137,7 +3138,7 @@ def loading_modal():
                         ui.modal_show(loading_modal())
                         try:
                             top_k_affiliations = input.TopAffProdK()
-                            result = get_affiliation_production_over_time(df, top_k_affiliations)
+                            result = get_affiliation_production_over_time(df.get(), top_k_affiliations)
                             affiliations_production_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -3172,7 +3173,7 @@ def table_affiliations_production():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, table_affiliations_production = result
-                                return ui.HTML(DT(table_affiliations_production, style="width=100%;"))
+                                return ui.HTML(DT(table_affiliations_production, style="width:100%;"))
         
         # --- Affiliations' Local Impact Section ---
         with ui.nav_panel("None", value="corresponding_authors"):
@@ -3281,7 +3282,7 @@ def loading_modal():
                         ui.modal_show(loading_modal())
                         try:
                             top_k_countries = input.TopCountries()
-                            result = get_corresponding_author_countries(df, top_k_countries)
+                            result = get_corresponding_author_countries(df.get(), top_k_countries)
                             corresponding_authors_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -3316,7 +3317,7 @@ def table_countries_collaboration():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, countries_table = result
-                                return ui.HTML(DT(countries_table, style="width=100%;"))
+                                return ui.HTML(DT(countries_table, style="width:100%;"))
         
         # --- Countries' Scientific Production Section ---
         with ui.nav_panel("None", value="countries_scientific_production"):
@@ -3406,7 +3407,7 @@ def loading_modal():
                     
                     ui.modal_show(loading_modal())
                     try:
-                        result = get_countries_production(df)
+                        result = get_countries_production(df.get())
                         return result
                     finally:
                         ui.modal_remove()
@@ -3422,7 +3423,7 @@ def show_countries_production():
                         @render.ui
                         def table_countries_production():
                             _, countries_table = countries_production()
-                            return ui.HTML(DT(countries_table, style="width=100%;"))
+                            return ui.HTML(DT(countries_table, style="width:100%;"))
 
         # --- Countries' Production over Time Section ---
         with ui.nav_panel("None", value="countries_production_over_time"):
@@ -3531,7 +3532,7 @@ def loading_modal():
                         ui.modal_show(loading_modal())
                         try:
                             top_k_countries = input.TopCountriesProdK()
-                            result = get_countries_production_over_time(df, top_k_countries)
+                            result = get_countries_production_over_time(df.get(), top_k_countries)
                             countries_over_time_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -3566,7 +3567,7 @@ def table_countries_over_time():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, countries_table = result
-                                return ui.HTML(DT(countries_table, style="width=100%;"))
+                                return ui.HTML(DT(countries_table, style="width:100%;"))
         
         # --- Most Cited Countries Section ---
         with ui.nav_panel("None", value="most_cited_countries"):
@@ -3677,7 +3678,7 @@ def loading_modal():
                         try:
                             num_of_cited_countries = input.num_of_cited_countries()
                             cited_countries_measure = input.cited_countries()
-                            result = get_cited_countries(df, num_of_cited_countries, cited_countries_measure)
+                            result = get_cited_countries(df.get(), num_of_cited_countries, cited_countries_measure)
                             cited_countries_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -3712,7 +3713,7 @@ def table_cited_countries():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, cited_countries_tab = result
-                                return ui.HTML(DT(cited_countries_tab, style="width=100%;"))
+                                return ui.HTML(DT(cited_countries_tab, style="width:100%;"))
         
         # --- Most Global Cited Documents Section ---
         with ui.nav_panel("None", value="most_global_cited_documents"):
@@ -3817,7 +3818,7 @@ def loading_modal():
                         try:
                             num_of_cited_docs = input.num_of_cited_docs()
                             cited_docs = input.cited_docs()
-                            result = get_cited_documents(df, num_of_cited_docs, cited_docs)
+                            result = get_cited_documents(df.get(), num_of_cited_docs, cited_docs)
                             cited_documents_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -3852,7 +3853,7 @@ def table_cited_documents():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, cited_documents_tab = result
-                                return ui.HTML(DT(cited_documents_tab, style="width=100%;"))
+                                return ui.HTML(DT(cited_documents_tab, style="width:100%;"))
         
         # --- Most Local Cited Documents Section ---
         with ui.nav_panel("None", value="most_local_cited_documents"):
@@ -3964,7 +3965,7 @@ def loading_modal():
                             # Run analysis
                             num_of_local_cited_docs = input.num_of_local_cited_docs()
                             field_separator = input.field_separator()
-                            result = get_local_cited_documents(df, num_of_local_cited_docs, field_separator)
+                            result = get_local_cited_documents(df.get(), num_of_local_cited_docs, field_separator)
                             local_cited_documents_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -3998,7 +3999,7 @@ def table_local_cited_documents():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, local_cited_documents_tab = result
-                                return ui.HTML(DT(local_cited_documents_tab, style="width=100%;"))
+                                return ui.HTML(DT(local_cited_documents_tab, style="width:100%;"))
         
         # --- Most Local Cited References Section ---
         with ui.nav_panel("None", value="most_local_cited_references"):
@@ -4110,7 +4111,7 @@ def loading_modal():
                             # Run analysis
                             num_of_cited_refs = input.num_of_cited_refs()
                             field_separator_ref = input.field_separator_ref()
-                            result = get_local_cited_refs(df, num_of_cited_refs, field_separator_ref)
+                            result = get_local_cited_refs(df.get(), num_of_cited_refs, field_separator_ref)
                             local_cited_refs_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -4144,7 +4145,7 @@ def table_local_cited_refs():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, local_cited_refs_tab = result
-                                return ui.HTML(DT(local_cited_refs_tab, style="width=100%;"))
+                                return ui.HTML(DT(local_cited_refs_tab, style="width:100%;"))
         
         # --- References Spectroscopy Section ---
         with ui.nav_panel("None", value="references_spectroscopy"):
@@ -4260,7 +4261,7 @@ def loading_modal():
                             start_year = input.start_year()
                             end_year = input.end_year()
                             field_separator_spec = input.field_separator_spec()
-                            result = get_references_spectroscopy(df, start_year, end_year, field_separator_spec)
+                            result = get_references_spectroscopy(df.get(), start_year, end_year, field_separator_spec)
                             ref_spectroscopy_results.set(result)
                         finally:
                             ui.modal_remove()
@@ -4294,7 +4295,7 @@ def table_references_rpy():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, ref_rpy_tab, _ = result
-                                return ui.HTML(DT(ref_rpy_tab, style="width=100%;"))
+                                return ui.HTML(DT(ref_rpy_tab, style="width:100%;"))
 
                         with ui.nav_panel("Table - Cited References"):
                             @render.ui
@@ -4306,7 +4307,7 @@ def table_references_spectroscopy():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, _, ref_spectroscopy_tab = result
-                                return ui.HTML(DT(ref_spectroscopy_tab, style="width=100%;"))
+                                return ui.HTML(DT(ref_spectroscopy_tab, style="width:100%;"))
 
         # --- Most Frequent Words ---
         with ui.nav_panel("None", value="most_frequent_words"):
@@ -4470,7 +4471,7 @@ def loading_modal():
                                 file_upload_synonyms_mfw = None
                                 synonyms_data_mfw = None
 
-                            result = get_frequent_words(df, ngram_mfw, num_of_words_mfw, field_mfw, file_upload_terms_mfw, file_upload_synonyms_mfw)
+                            result = get_frequent_words(df.get(), ngram_mfw, num_of_words_mfw, field_mfw, file_upload_terms_mfw, file_upload_synonyms_mfw)
                             frequent_words_results.set(result)
                         except Exception as e:
                             ui.notification_show(f"❌ Error in analysis: {str(e)}", type="error", duration=10)
@@ -4524,7 +4525,7 @@ def table_frequent_words():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, frequent_words_tab = result
-                                return ui.HTML(DT(frequent_words_tab, style="width=100%;"))
+                                return ui.HTML(DT(frequent_words_tab, style="width:100%;"))
         
         # --- WordCloud Section ---
         with ui.nav_panel("None", value="wordcloud"):
@@ -4688,7 +4689,7 @@ def loading_modal():
                                 file_upload_synonyms_wc = None
                                 synonyms_data_wc = None
 
-                            result = get_wordcloud(df, ngram_wc, num_of_words_wc, field_wc, file_upload_terms_wc, file_upload_synonyms_wc)
+                            result = get_wordcloud(df.get(), ngram_wc, num_of_words_wc, field_wc, file_upload_terms_wc, file_upload_synonyms_wc)
                             wordcloud_results.set(result)
                         except Exception as e:
                             ui.notification_show(f"❌ Error in analysis: {str(e)}", type="error", duration=10)
@@ -4742,7 +4743,7 @@ def table_wordcloud():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, wordcloud_tab = result
-                                return ui.HTML(DT(wordcloud_tab, style="width=100%;"))
+                                return ui.HTML(DT(wordcloud_tab, style="width:100%;"))
         
         # --- TreeMap Section ---
         with ui.nav_panel("None", value="treemap"):
@@ -4906,7 +4907,7 @@ def loading_modal():
                                 file_upload_synonyms_tm = None
                                 synonyms_data_tm = None
 
-                            result = get_treemap(df, ngram_tm, num_of_words_tm, field_tm, file_upload_terms_tm, file_upload_synonyms_tm)
+                            result = get_treemap(df.get(), ngram_tm, num_of_words_tm, field_tm, file_upload_terms_tm, file_upload_synonyms_tm)
                             treemap_results.set(result)
                         except Exception as e:
                             ui.notification_show(f"❌ Error in analysis: {str(e)}", type="error", duration=10)
@@ -4960,7 +4961,7 @@ def table_treemap():
                                         style="height: 400px; display: flex; flex-direction: column; justify-content: center; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
                                     )
                                 _, treemap_tab = result
-                                return ui.HTML(DT(treemap_tab, style="width=100%;"))
+                                return ui.HTML(DT(treemap_tab, style="width:100%;"))
         
         # --- References Spectroscopy Section ---
         with ui.nav_panel("None", value="words_frequency_over_time"):
@@ -5127,7 +5128,7 @@ def loading_modal():
                                 file_upload_synonyms_wf = None
                                 synonyms_data_wf = None
 
-                            result = get_word_frequency(df, ngram_wf, field_wf, file_upload_terms_wf, file_upload_synonyms_wf, occurrences, top_words)
+                            result = get_word_frequency(df.get(), ngram_wf, field_wf, file_upload_terms_wf, file_upload_synonyms_wf, occurrences, top_words)
                             word_frequency_results.set(result)
                         except Exception as e:
                             ui.notification_show(f"❌ Error in analysis: {str(e)}", type="error", duration=10)
@@ -5244,7 +5245,7 @@ def get_ngrams_tt():
                         @render.express()
                         def show_timespan():
                             data_temp = main_informations()
-                            ui.input_slider("time_window", "Timespan", sep="", ticks=True, min=data_temp['Min_Year'][0], max=data_temp['Max_Year'][0], value=[data_temp['Min_Year'][0], data_temp['Max_Year'][0]], step=1, time_format="YYYY")
+                            ui.input_slider("time_window", "Timespan", sep="", ticks=True, min=data_temp["Min_Year"].iloc[0], max=data_temp["Max_Year"].iloc[0], value=[data_temp["Min_Year"].iloc[0], data_temp["Max_Year"].iloc[0]], step=1, time_format="YYYY")
 
                         with ui.accordion(id="acc_tt", multiple=True, open=False):
                             with ui.accordion_panel("Text Editing"):
@@ -5357,7 +5358,7 @@ def loading_modal():
                             word_mimimum_frequency = input.word_mimimum_frequency()
                             number_of_words_year = input.number_of_words_year()
 
-                            result = get_trend_topics(df, ngram_tt, field_tt, time_window, file_upload_terms_tt, file_upload_synonyms_tt, word_mimimum_frequency, number_of_words_year)
+                            result = get_trend_topics(df.get(), ngram_tt, field_tt, time_window, file_upload_terms_tt, file_upload_synonyms_tt, word_mimimum_frequency, number_of_words_year)
                             trend_topics_results.set(result)
                         except Exception as e:
                             ui.notification_show(f"❌ Error in analysis: {str(e)}", type="error", duration=10)
@@ -5561,7 +5562,7 @@ def loading_modal():
                             community_repulsion = input.community_repulsion()
                             clustering_algorithm = input.clustering_algorithm()
 
-                            result = get_clustering_coupling(df, unit_of_analysis, coupling_field, stemmer, impact_measure, cluster_labeling, ngram, num_of_units, min_cluster_freq, label_per_cluster, label_size, community_repulsion, clustering_algorithm)
+                            result = get_clustering_coupling(df.get(), unit_of_analysis, coupling_field, stemmer, impact_measure, cluster_labeling, ngram, num_of_units, min_cluster_freq, label_per_cluster, label_size, community_repulsion, clustering_algorithm)
                             clustering_coupling_results.set(result)
                         except Exception as e:
                             ui.notification_show(f"❌ Error in analysis: {str(e)}", type="error", duration=10)
@@ -5848,7 +5849,7 @@ def loading_modal():
                                 modal_content.append(ui.markdown("""<h3 style=\"text-align:center;\">Synonyms to Remove</h3>"""))
                                 modal_content.append(ui.HTML(DT(synonyms_data)))
 
-                            result = get_co_occurence_network(df, field_cn, ngram_cn, network_layout, clustering_algorithm_cn, normalization_cn, color_by_year, num_of_nodes, 
+                            result = get_co_occurence_network(df.get(), field_cn, ngram_cn, network_layout, clustering_algorithm_cn, normalization_cn, color_by_year, num_of_nodes, 
                                                             repulsion_force, remove_isolated, min_edges, node_opacity, num_of_labels, node_shape, label_size_ls,
                                                             edge_size, node_shadow, edit_nodes, label_cex, file_upload_terms, file_upload_synonyms)
                             co_occurrence_network_results.set(result)
@@ -5895,7 +5896,7 @@ def table_co_occurrence_network():
                                 result = co_occurrence_network_results.get()
                                 if result is not None:
                                     _, _, co_occurrence_network_tab, _ = result
-                                    return ui.HTML(DT(co_occurrence_network_tab, style="width=100%;"))
+                                    return ui.HTML(DT(co_occurrence_network_tab, style="width:100%;"))
                                 else:
                                     return ui.div(
                                         ui.p("Click the Run Analysis button to run co-occurrence network", style="text-align: center; color: #999; font-size: 16px;"),
@@ -6068,7 +6069,7 @@ def loading_modal():
                             cluster = input.thematic_clustering()
                             repulsion = input.thematic_repulsion()
 
-                            result = get_thematic_map(df, field, n, minfreq, ngram, stemming,
+                            result = get_thematic_map(df.get(), field, n, minfreq, ngram, stemming,
                                                     label_size, n_labels, repulsion, cluster)
                             thematic_map_results.set(result)
                         except Exception as e:
@@ -6116,7 +6117,7 @@ def table_thematic_map():
                                 result = thematic_map_results.get()
                                 if result is not None:
                                     _, _, thematic_map_table, _, _ = result
-                                    return ui.HTML(DT(thematic_map_table, style="width=100%;"))
+                                    return ui.HTML(DT(thematic_map_table, style="width:100%;"))
                                 else:
                                     return ui.div(
                                         ui.p("Click the Run Analysis button to run thematic map", style="text-align: center; color: #999; font-size: 16px;"),
@@ -6129,7 +6130,7 @@ def clusters_thematic_map():
                                 result = thematic_map_results.get()
                                 if result is not None:
                                     _, _, _, thematic_map_cluster, _ = result
-                                    return ui.HTML(DT(thematic_map_cluster, style="width=100%;"))
+                                    return ui.HTML(DT(thematic_map_cluster, style="width:100%;"))
                                 else:
                                     return ui.div(
                                         ui.p("Click the Run Analysis button to run thematic map", style="text-align: center; color: #999; font-size: 16px;"),
@@ -6142,7 +6143,7 @@ def documents_thematic_map():
                                 result = thematic_map_results.get()
                                 if result is not None:
                                     _, _, _, _, thematic_map_documents = result
-                                    return ui.HTML(DT(thematic_map_documents, maxBytes="10MB", style="width=100%;"))
+                                    return ui.HTML(DT(thematic_map_documents, maxBytes="10MB", style="width:100%;"))
                                 else:
                                     return ui.div(
                                         ui.p("Click the Run Analysis button to run thematic map", style="text-align: center; color: #999; font-size: 16px;"),
@@ -6403,7 +6404,7 @@ def loading_modal():
                             ngrams = input.thematic_evolution_ngram() if field in ["TI", "AB"] else 1
                             stemming = input.thematic_evolution_stemmer() if field in ["TI", "AB"] else False
 
-                            result = get_thematic_evolution(df, field, years, n, weight_index, min_weight_index, minfreq, label_size, ngrams, stemming, n_labels, overlap, remove_terms, synonyms, cluster)
+                            result = get_thematic_evolution(df.get(), field, years, n, weight_index, min_weight_index, minfreq, label_size, ngrams, stemming, n_labels, overlap, remove_terms, synonyms, cluster)
                             thematic_evolution_results.set(result)
                         except Exception as e:
                             ui.notification_show(f"❌ Error in analysis: {str(e)}", type="error", duration=10)
@@ -6444,7 +6445,7 @@ def table_thematic_evolution():
                                             result = thematic_evolution_results.get()
                                             if result is not None:
                                                 _, thematic_evolution_table, _ = result
-                                                return ui.HTML(DT(thematic_evolution_table, style="width=100%;"))
+                                                return ui.HTML(DT(thematic_evolution_table, style="width:100%;"))
                                             else:
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
@@ -6483,7 +6484,7 @@ def table_thematic_evolution_2():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 0:
-                                                        return ui.HTML(DT(TM[0]["words"], style="width=100%;"))
+                                                        return ui.HTML(DT(TM[0]["words"], style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6496,7 +6497,7 @@ def clusters_thematic_evolution_2():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 0:
-                                                        return ui.HTML(DT(TM[0]["clusters"], style="width=100%;"))
+                                                        return ui.HTML(DT(TM[0]["clusters"], style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6509,7 +6510,7 @@ def documents_thematic_evolution_2():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 0:
-                                                        return ui.HTML(DT(TM[0]["documentToClusters"], maxBytes="10MB", style="width=100%;"))
+                                                        return ui.HTML(DT(TM[0]["documentToClusters"], maxBytes="10MB", style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6547,7 +6548,7 @@ def table_thematic_evolution_3():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 1:
-                                                        return ui.HTML(DT(TM[1]["words"], style="width=100%;"))
+                                                        return ui.HTML(DT(TM[1]["words"], style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6560,7 +6561,7 @@ def clusters_thematic_evolution_3():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 1:
-                                                        return ui.HTML(DT(TM[1]["clusters"], style="width=100%;"))
+                                                        return ui.HTML(DT(TM[1]["clusters"], style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6573,7 +6574,7 @@ def documents_thematic_evolution_3():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 1:
-                                                        return ui.HTML(DT(TM[1]["documentToClusters"], maxBytes="10MB", style="width=100%;"))
+                                                        return ui.HTML(DT(TM[1]["documentToClusters"], maxBytes="10MB", style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6611,7 +6612,7 @@ def table_thematic_evolution_4():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 2:
-                                                        return ui.HTML(DT(TM[2]["words"], style="width=100%;"))
+                                                        return ui.HTML(DT(TM[2]["words"], style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6624,7 +6625,7 @@ def clusters_thematic_evolution_4():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 2:
-                                                        return ui.HTML(DT(TM[2]["clusters"], style="width=100%;"))
+                                                        return ui.HTML(DT(TM[2]["clusters"], style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6637,7 +6638,7 @@ def documents_thematic_evolution_4():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 2:
-                                                        return ui.HTML(DT(TM[2]["documentToClusters"], maxBytes="10MB", style="width=100%;"))
+                                                        return ui.HTML(DT(TM[2]["documentToClusters"], maxBytes="10MB", style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6675,7 +6676,7 @@ def table_thematic_evolution_5():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 3:
-                                                        return ui.HTML(DT(TM[3]["words"], style="width=100%;"))
+                                                        return ui.HTML(DT(TM[3]["words"], style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6688,7 +6689,7 @@ def clusters_thematic_evolution_5():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 3:
-                                                        return ui.HTML(DT(TM[3]["clusters"], style="width=100%;"))
+                                                        return ui.HTML(DT(TM[3]["clusters"], style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6701,7 +6702,7 @@ def documents_thematic_evolution_5():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 3:
-                                                        return ui.HTML(DT(TM[3]["documentToClusters"], maxBytes="10MB", style="width=100%;"))
+                                                        return ui.HTML(DT(TM[3]["documentToClusters"], maxBytes="10MB", style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6739,7 +6740,7 @@ def table_thematic_evolution_6():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 4:
-                                                        return ui.HTML(DT(TM[4]["words"]), style="width=100%;")
+                                                        return ui.HTML(DT(TM[4]["words"]), style="width:100%;")
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6752,7 +6753,7 @@ def clusters_thematic_evolution_6():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 4:
-                                                        return ui.HTML(DT(TM[4]["clusters"], style="width=100%;"))
+                                                        return ui.HTML(DT(TM[4]["clusters"], style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6765,7 +6766,7 @@ def documents_thematic_evolution_6():
                                                 if result is not None:
                                                     _, _, TM = result
                                                     if len(TM) > 4:
-                                                        return ui.HTML(DT(TM[4]["documentToClusters"], maxBytes="10MB", style="width=100%;"))
+                                                        return ui.HTML(DT(TM[4]["documentToClusters"], maxBytes="10MB", style="width:100%;"))
                                                 return ui.div(
                                                     ui.p("Click the Run Analysis button to run thematic evolution", style="text-align: center; color: #999; font-size: 16px;"),
                                                     style="display: flex; flex-direction: column; justify-content: center; align-items: center; height: 300px; border: 2px dashed #ddd; border-radius: 10px; margin: 20px;"
@@ -6995,7 +6996,7 @@ def loading_modal():
                                 labelsize=input.wordmap_labelsize()
                                 size=input.wordmap_dot_size()
 
-                                result = get_factorial_analysis(df, ngram, field, terms_data_wm, synonyms_data_wm, n_terms, n_clusters, num_documents, method, dimX, dimY, topWordPlot, threshold, labelsize, size)
+                                result = get_factorial_analysis(df.get(), ngram, field, terms_data_wm, synonyms_data_wm, n_terms, n_clusters, num_documents, method, dimX, dimY, topWordPlot, threshold, labelsize, size)
                                 factorial_analysis_results.set(result)
                             except Exception as e:
                                 ui.notification_show(f"❌ Error in analysis: {str(e)}", type="error", duration=10)
@@ -7051,7 +7052,7 @@ def show_words_by_cluster():
                                 result = factorial_analysis_results.get()
                                 if result is not None:
                                     _, _, words_by_cluster, _ = result
-                                    return ui.HTML(DT(words_by_cluster, style="width=100%;"))
+                                    return ui.HTML(DT(words_by_cluster, style="width:100%;"))
                                 else:
                                     return ui.div(
                                         ui.p("Click the Run Analysis button to run factorial analysis", style="text-align: center; color: #999; font-size: 16px;"),
@@ -7064,7 +7065,7 @@ def show_articles_by_cluster():
                                 result = factorial_analysis_results.get()
                                 if result is not None:
                                     _, _, _, articles_by_cluster = result
-                                    return ui.HTML(DT(articles_by_cluster, style="width=100%;"))
+                                    return ui.HTML(DT(articles_by_cluster, style="width:100%;"))
                                 else:
                                     return ui.div(
                                         ui.p("Click the Run Analysis button to run factorial analysis", style="text-align: center; color: #999; font-size: 16px;"),
@@ -7186,7 +7187,7 @@ def loading_modal():
                             
                             # Execute analysis
                             result = get_co_citation(
-                                df=df,
+                                df=df.get(),
                                 field=field,
                                 sep=sep,
                                 cocit_network_layout=cocit_network_layout,
@@ -7345,7 +7346,7 @@ def show_cocitation_table():
                                 result = co_citation_network_results.get()
                                 if result is not None:
                                     _, _, cocit_table, _ = result
-                                    return ui.HTML(DT(cocit_table, style="width=100%;"))
+                                    return ui.HTML(DT(cocit_table, style="width:100%;"))
                                 else:
                                     return ui.div(
                                         ui.p("Click the Run Analysis button to generate the co-citation table.", style="text-align: center; color: #666; font-size: 16px;"),
@@ -7474,7 +7475,7 @@ def loading_modal():
                             histsize = input.histsize()
                             # Execute analysis with correct parameters
                             result = get_historiograph(
-                                df=df,
+                                df=df.get(),
                                 node_label="AU1",
                                 histNodes=histNodes,
                                 hist_isolates=True,
@@ -7560,7 +7561,7 @@ def show_hist_table():
                                 result = historiograph_results.get()
                                 if result is not None:
                                     _, hist_tab, _ = result
-                                    return ui.HTML(DT(hist_tab, style="width=100%;"))
+                                    return ui.HTML(DT(hist_tab, style="width:100%;"))
                                 else:
                                     return ui.div(
                                         ui.p("Click the Run Analysis button to generate the historiograph table.", style="text-align: center; color: #666; font-size: 16px;"),
@@ -7690,7 +7691,7 @@ def loading_modal():
                             
                             # Execute analysis
                             result = get_collaboration_network(
-                                df=df,
+                                df=df.get(),
                                 field=field,
                                 network_layout=network_layout,
                                 clustering_algorithm=clustering_algorithm,
@@ -7865,7 +7866,7 @@ def show_collaboration_table():
                                 result = collaboration_network_results.get()
                                 if result is not None:
                                     _, _, collab_table, _ = result
-                                    return ui.HTML(DT(collab_table, style="width=100%;"))
+                                    return ui.HTML(DT(collab_table, style="width:100%;"))
                                 else:
                                     return ui.div(
                                         ui.p("Click the Run Analysis button to generate the collaboration table.", style="text-align: center; color: #666; font-size: 16px;"),
@@ -7987,7 +7988,7 @@ def loading_modal():
                         try:
                             # Execute analysis (with default parameters for world map collaboration)
                             result = get_world_map_collaboration(
-                                df=df,
+                                df=df.get(),
                                 edges_min=1,
                                 edgesize=5
                             )
@@ -8045,7 +8046,7 @@ def show_world_map_collaboration_table():
                                 result = countries_collaboration_network_results.get()
                                 if result is not None:
                                     _, world_map_table = result
-                                    return ui.HTML(DT(world_map_table, style="width=100%;"))
+                                    return ui.HTML(DT(world_map_table, style="width:100%;"))
                                 else:
                                     return ui.div(
                                         ui.p("Click the Run Analysis button to generate the world map collaboration table.", style="text-align: center; color: #666; font-size: 16px;"),
diff --git a/config.yaml b/config.yaml
new file mode 100644
index 000000000..bc39756b7
--- /dev/null
+++ b/config.yaml
@@ -0,0 +1,8 @@
+extraction:
+  query: "bibliometrics"
+  max_results: 50
+  source: "OPENALEX"
+
+paths:
+  output_csv: "standardized_output.csv"
+  log_file: "pipeline.log"
\ No newline at end of file
diff --git a/functions/get_affiliationproductionovertime.py b/functions/get_affiliationproductionovertime.py
index e1b87f583..310ee2fe7 100644
--- a/functions/get_affiliationproductionovertime.py
+++ b/functions/get_affiliationproductionovertime.py
@@ -12,9 +12,10 @@ def get_affiliation_production_over_time(df, top_k_affiliations):
     Returns:
         A Plotly figure object representing the affiliation's production over time.
     """
-    data = df.get()
+    data = df
 
-    AFF = data["AU_UN"].dropna().apply(lambda x: [aff for aff in x if aff.strip() != ""])
+    AFF_series = data["AU_UN"].fillna("").apply(lambda x: [aff for aff in (x if isinstance(x, list) else str(x).split(";")) if str(aff).strip() not in ["", "nan"]])
+    AFF = AFF_series
     nAFF = [len(aff) for aff in AFF]
 
     affiliations = [aff for sublist in AFF for aff in sublist]
diff --git a/functions/get_annualproduction.py b/functions/get_annualproduction.py
index dd27105c2..99166bb32 100644
--- a/functions/get_annualproduction.py
+++ b/functions/get_annualproduction.py
@@ -11,7 +11,7 @@ def get_annual_production(df):
     Returns:
         A Plotly figure object representing the annual scientific production.
     """
-    data = df.get()
+    data = df
 
     # Calculate the number of publications per year
     publications_per_year = data["PY"].value_counts().sort_index().reset_index()
diff --git a/functions/get_authorlocalimpact.py b/functions/get_authorlocalimpact.py
index 74a68e263..bf9a88c21 100644
--- a/functions/get_authorlocalimpact.py
+++ b/functions/get_authorlocalimpact.py
@@ -13,7 +13,7 @@ def get_authors_local_impact(df, num_of_authors_local_impact, author_local_impac
     Returns:
         A Plotly figure object and a DataFrame of the most impactful sources.
     """
-    df = df.get()
+    df = df
     today = pd.Timestamp.now().year
 
     # Ensure 'TC' and 'PY' are numeric
diff --git a/functions/get_authorproductionovertime.py b/functions/get_authorproductionovertime.py
index 65edaca96..ba1bf0a4d 100644
--- a/functions/get_authorproductionovertime.py
+++ b/functions/get_authorproductionovertime.py
@@ -16,7 +16,7 @@ def get_author_production_over_time(df, top_k_authors):
         table_authors_production (pd.DataFrame): Table summarizing authors' production with TC and TCpY.
         table_documents (pd.DataFrame): Detailed table with additional document information.
     """
-    data = df.get()
+    data = df
 
     # Ensure "PY" is numeric
     data["PY"] = pd.to_numeric(data["PY"], errors="coerce")
diff --git a/functions/get_averagecitations.py b/functions/get_averagecitations.py
index d752aa9b7..638a14849 100644
--- a/functions/get_averagecitations.py
+++ b/functions/get_averagecitations.py
@@ -11,7 +11,7 @@ def get_average_citations(df):
     Returns:
         A Plotly figure object representing the average citations per year.
     """
-    data = df.get()
+    data = df
 
     # Calculate the current year
     current_year = pd.Timestamp.now().year + 1
diff --git a/functions/get_bradfordlaw.py b/functions/get_bradfordlaw.py
index 86580591f..5ff8a0fec 100644
--- a/functions/get_bradfordlaw.py
+++ b/functions/get_bradfordlaw.py
@@ -12,7 +12,7 @@ def get_bradford_law(df):
         A Plotly figure object and a DataFrame of the Bradford's Law zones.
     """
     # Sort data by frequency of occurrence (equivalent to R's sort(table(M$SO), decreasing = TRUE))
-    data = df.get()
+    data = df
     source_counts = data["SO"].value_counts()
     
     # Total number of sources
@@ -67,7 +67,7 @@ def get_bradford_law(df):
     fig.add_shape(
         type="rect",
         x0=0,
-        x1=np.log(df_bradford["Rank"][a]),
+        x1=np.log(df_bradford["Rank"].iloc[int(a)-1]),
         y0=0,
         y1=df_bradford["Freq"].max(),
         fillcolor="#B3D1F2",
@@ -78,7 +78,7 @@ def get_bradford_law(df):
 
     # Add the "Core Sources" annotation with smaller font
     fig.add_annotation(
-        x=np.log(df_bradford["Rank"][a]) / 2,
+        x=np.log(df_bradford["Rank"].iloc[int(a)-1]) / 2,
         y=df_bradford["Freq"].max() * 0.85,
         text="<b>Core<br>Sources</b>",
         showarrow=False,
diff --git a/functions/get_bradfordlaw.py.bak b/functions/get_bradfordlaw.py.bak
new file mode 100644
index 000000000..569aaa4d3
--- /dev/null
+++ b/functions/get_bradfordlaw.py.bak
@@ -0,0 +1,126 @@
+from www.services import *
+
+
+def get_bradford_law(df):
+    """
+    Generate a plot and table based on Bradford's Law.
+    
+    Args:
+        df: A DataFrame object containing the data.
+        
+    Returns:
+        A Plotly figure object and a DataFrame of the Bradford's Law zones.
+    """
+    # Sort data by frequency of occurrence (equivalent to R's sort(table(M$SO), decreasing = TRUE))
+    data = df
+    source_counts = data["SO"].value_counts()
+    
+    # Total number of sources
+    n = source_counts.sum()
+    # Cumulative sum of the frequencies (equivalent to cumsum in R)
+    cumSO = source_counts.cumsum()
+    
+    # Define the cut points for Bradford's Law (zones)
+    cutpoints = [1, n * 0.33, n * 0.67, float('inf')]
+    groups = pd.cut(cumSO, bins=cutpoints, labels=["Zone 1", "Zone 2", "Zone 3"])
+    
+    # Find the cut points for "Core" sources
+    a = (cumSO < n * 0.33).sum() + 1
+    b = (cumSO < n * 0.67).sum() + 1
+    Z = ["Zone 1"] * a + ["Zone 2"] * (b - a) + ["Zone 3"] * (len(cumSO) - b)
+    
+    # Create a DataFrame for Bradford's Law table
+    df_bradford = pd.DataFrame({
+        "SO": cumSO.index.str[:25],  # Shorten the source names to 25 characters if necessary
+        "Rank": range(1, len(cumSO) + 1),
+        "Freq": source_counts.values,
+        "cumFreq": cumSO.values,
+        "Zone": Z
+    })
+    
+    # Create the Plotly figure
+    fig = go.Figure()
+
+    # Add the line plot without text above the points
+    fig.add_trace(go.Scatter(
+        x=np.log(df_bradford["Rank"]),
+        y=df_bradford["Freq"],
+        mode='lines+markers',
+        name='Articles per Source',
+        marker=dict(
+            color='#5567BB',
+            size=10,
+            line=dict(width=1, color='white'),
+            opacity=0.95
+        ),
+        line=dict(color='#5567BB', width=2, shape='spline'),
+        hovertemplate=(
+            "<b>Source:</b> %{customdata[0]}<br>"
+            "<b>Rank:</b> %{x:.2f}<br>"
+            "<b>N. of Documents:</b> %{y}<br>"
+            "<b>Zone:</b> %{customdata[1]}<extra></extra>"
+        ),
+        customdata=np.stack([df_bradford["SO"], df_bradford["Zone"]], axis=-1)
+    ))
+
+    # Add the "Core Sources" area with the rectangle
+    fig.add_shape(
+        type="rect",
+        x0=0,
+        x1=np.log(df_bradford["Rank"][a]),
+        y0=0,
+        y1=df_bradford["Freq"].max(),
+        fillcolor="#B3D1F2",
+        opacity=0.18,
+        line_width=0,
+        layer="below"
+    )
+
+    # Add the "Core Sources" annotation with smaller font
+    fig.add_annotation(
+        x=np.log(df_bradford["Rank"][a]) / 2,
+        y=df_bradford["Freq"].max() * 0.85,
+        text="<b>Core<br>Sources</b>",
+        showarrow=False,
+        font=dict(size=15, color="#5567BB", family="Segoe UI, Arial"),
+        align="center",
+        bgcolor="rgba(255,255,255,0.7)",
+        bordercolor="#B3D1F2",
+        borderpad=4,
+        borderwidth=1,
+    )
+
+    # Customize the X axis labels (log scale) with smaller font
+    fig.update_layout(
+        xaxis=dict(
+            title="Source log(Rank)",
+            tickmode='array',
+            tickvals=np.log(df_bradford["Rank"][:a]),
+            ticktext=df_bradford["SO"][:a],
+            tickangle=90,
+            showgrid=True,
+            gridcolor="#F0F0F0",
+            zeroline=False,
+            tickfont=dict(size=10),
+        ),
+        yaxis=dict(
+            title="N. of Documents",
+            showgrid=True,
+            gridcolor="#F0F0F0",
+            zeroline=False,
+            tickfont=dict(size=10),
+        ),
+        plot_bgcolor='white',
+        font=dict(color="#222222", size=11, family="Segoe UI, Arial"),
+        margin=dict(l=80, r=40, t=40, b=120),
+        height=800,
+        showlegend=False,
+        hoverlabel=dict(
+            bgcolor="white",
+            font_size=11,
+            font_family="Segoe UI, Arial",
+            bordercolor="#5567BB"
+        ),
+    )
+    
+    return fig, df_bradford
diff --git a/functions/get_citedcountries.py b/functions/get_citedcountries.py
index ac95a8d0c..07d9d65a2 100644
--- a/functions/get_citedcountries.py
+++ b/functions/get_citedcountries.py
@@ -15,7 +15,7 @@ def get_cited_countries(df, num_of_cited_countries, cited_countries_measure):
     """
     # Extract metadata tags for cited countries
     df = metaTagExtraction(df, "AU1_CO")
-    df = df.get()
+    df = df
 
     # Prepare the table for ranking countries
     tab = (
@@ -100,6 +100,7 @@ def get_cited_countries(df, num_of_cited_countries, cited_countries_measure):
 
     # Set x-axis ticks
     max_x = x_values.max()
+    max_x = 0 if pd.isna(max_x) else max_x
     tick_step = 5 if max_x <= 50 else int(max_x // 10) or 1
     x_ticks = list(range(0, int(max_x) + tick_step, tick_step))
     if x_ticks[-1] < max_x:
diff --git a/functions/get_citeddocuments.py b/functions/get_citeddocuments.py
index 14491f74a..badf146ae 100644
--- a/functions/get_citeddocuments.py
+++ b/functions/get_citeddocuments.py
@@ -14,8 +14,8 @@ def get_cited_documents(df, num_of_cited_docs, cited_docs_measure):
         A Plotly figure object and a DataFrame of the most cited documents.
     """
     # Extract metadata tags for cited documents
-    df = metaTagExtraction(df, "SR")
-    df = df.get()
+    if "SR" not in df.columns or (df["SR"] == "").all():
+        df = metaTagExtraction(df, "SR")
 
     # Prepare the table for ranking documents
     current_year = pd.to_datetime("today").year
diff --git a/functions/get_co_occurence_network.py b/functions/get_co_occurence_network.py
index ec96b143a..51ff616d0 100644
--- a/functions/get_co_occurence_network.py
+++ b/functions/get_co_occurence_network.py
@@ -136,7 +136,7 @@ def get_co_occurence_network(df, field_cn, ngram, network_layout, clustering_alg
 
     # Generate layout
     # Using default igraph layout
-    layout = cocnet['graph']['layout']
+    layout = cocnet['layout']
     print("Layout:", layout)
     # Get coordinates from layout
     coords = np.array([[pos[0], pos[1]] for pos in layout])
@@ -479,7 +479,7 @@ def field_by_year(df, field_cn, timespan=None, min_freq=2, n_items=5, remove_ter
         The field to analyze ('ID', 'DE', 'TI', 'AB', 'WC')
     """
     # Get the field data
-    M = df.get()
+    M = df
     
     # Create co-occurrence matrix
     A = cocMatrix(df, field_cn, binary=False, remove_terms=remove_terms, synonyms=synonyms)
diff --git a/functions/get_cocitation.py b/functions/get_cocitation.py
index 8bad105c0..a90f628a9 100644
--- a/functions/get_cocitation.py
+++ b/functions/get_cocitation.py
@@ -95,7 +95,7 @@ def get_co_citation(
         b = np.random.randint(0, 255)
         cluster_colors[cluster_id] = f"rgba({r},{g},{b},0.7)"
 
-    layout = cocitnet['graph']['layout']
+    layout = cocitnet['layout']
     coords = np.array([[pos[0], pos[1]] for pos in layout])
     coords = coords / np.abs(coords).max()
     coords[:, 0] *= 1000
diff --git a/functions/get_collaborationnetwork.py b/functions/get_collaborationnetwork.py
index 512ed7489..88213b9c5 100644
--- a/functions/get_collaborationnetwork.py
+++ b/functions/get_collaborationnetwork.py
@@ -46,7 +46,7 @@ def get_collaboration_network(
     print("Generating collaboration network...")
 
     M = df
-    m = df.get()
+    m = df
     NetRefs = None
     Title = ""
 
@@ -108,7 +108,7 @@ def get_collaboration_network(
         b = np.random.randint(0, 255)
         cluster_colors[cluster_id] = f"rgba({r},{g},{b},{opacity})"
 
-    layout = netplot['graph']['layout']
+    layout = netplot['layout']
     coords = np.array([[pos[0], pos[1]] for pos in layout])
     coords = coords / np.abs(coords).max()
     coords[:, 0] *= 1000
diff --git a/functions/get_correspondingauthorcountries.py b/functions/get_correspondingauthorcountries.py
index 5ba9832b2..f51a0004f 100644
--- a/functions/get_correspondingauthorcountries.py
+++ b/functions/get_correspondingauthorcountries.py
@@ -13,9 +13,11 @@ def get_corresponding_author_countries(df, top_k_countries):
         A Plotly figure object and a DataFrame of the most common corresponding author countries.
     """
     # Estrai i metadati "AU_CO" e "AU1_CO" e verifica il tipo di dati
-    df = metaTagExtraction(df, Field="AU_CO")  # Assumendo che `metaTagExtraction` sia già definita
-    df = metaTagExtraction(df, Field="AU1_CO")
-    data = df.get()  # Se `df` è un oggetto reattivo
+    if "AU_CO" not in df.columns or df["AU_CO"].apply(lambda x: isinstance(x, list) and len(x) == 0).all():
+        df = metaTagExtraction(df, Field="AU_CO")
+    if "AU1_CO" not in df.columns or (df["AU1_CO"] == "").all():
+        df = metaTagExtraction(df, Field="AU1_CO")
+    data = df  # Se `df` è un oggetto reattivo
 
     # Assicurati che le colonne siano di tipo stringa e rimuovi righe con valori mancanti
     data = data.dropna(subset=["AU1_CO", "AU_CO"])
diff --git a/functions/get_countriesproduction.py b/functions/get_countriesproduction.py
index 81c0e0c34..af8f474d0 100644
--- a/functions/get_countriesproduction.py
+++ b/functions/get_countriesproduction.py
@@ -13,7 +13,7 @@ def get_countries_production(df):
     """
     # Assicurati che i metadati siano stati estratti
     df = metaTagExtraction(df, "AU_CO")
-    df = df.get()
+    df = df
 
     # Conta le occorrenze dei paesi
     df["AU_CO"] = df["AU_CO"].apply(lambda x: x if isinstance(x, list) else [x])
diff --git a/functions/get_countriesproductionovertime.py b/functions/get_countriesproductionovertime.py
index aede25bbd..8039e12c4 100644
--- a/functions/get_countriesproductionovertime.py
+++ b/functions/get_countriesproductionovertime.py
@@ -13,7 +13,7 @@ def get_countries_production_over_time(df, top_k_countries):
         A Plotly figure object representing the country's production over time.
     """
     df = metaTagExtraction(df, "AU_CO")
-    data = df.get()
+    data = df
 
     AFF = pd.Series(data["AU_CO"]).dropna().apply(lambda x: [aff.strip() for aff in x if aff.strip() != ""])
     nAFF = [len(aff) for aff in AFF]
diff --git a/functions/get_factorialanalysis.py b/functions/get_factorialanalysis.py
index 3324bcfb6..1b08b177e 100644
--- a/functions/get_factorialanalysis.py
+++ b/functions/get_factorialanalysis.py
@@ -74,7 +74,7 @@ def get_factorial_analysis(
     # Set ngrams based on word_type
     ngrams = int(ngram) if field in ['TI', 'AB'] else 1
 
-    M = df.get()
+    M = df
     tab = table_tag(M, field, ngrams)
     
     if len(tab) >= 2:
@@ -136,8 +136,8 @@ def get_factorial_analysis(
 
             # Verifica che eigCorr esista prima di accedere
             if CS["res"] is not None and hasattr(CS["res"], "eigCorr"):
-                xlabel = f"Dim 1 ({CS['res'].eigCorr['perc'][dimX]:.2f}%)"
-                ylabel = f"Dim 2 ({CS['res'].eigCorr['perc'][dimY]:.2f}%)"
+                xlabel = f"Dim 1 ({CS["res"].eigCorr["perc"].iloc[dimX-1] if len(CS["res"].eigCorr["perc"]) > dimX-1 else 0:.2f}%)"
+                ylabel = f"Dim 2 ({CS['res'].eigCorr['perc'].iloc[dimY-1] if len(CS['res'].eigCorr['perc']) > dimY-1 else 0:.2f}%)"
             else:
                 xlabel, ylabel = "Dim 1", "Dim 2"
 
@@ -157,7 +157,8 @@ def get_factorial_analysis(
         wordCoord["dotSize"] = wordCoord["dotSize"].replace([np.inf, -np.inf], np.nan)
         wordCoord["dotSize"] = wordCoord["dotSize"].fillna(1)
         wordCoord["dotSize"] = wordCoord["dotSize"].clip(lower=1)
-        thres = sorted(wordCoord["dotSize"], reverse=True)[min(int(topWordPlot), len(wordCoord) - 1)]
+        topWordPlot_safe = min(int(topWordPlot) if np.isfinite(topWordPlot) else len(wordCoord), len(wordCoord) - 1)
+        thres = sorted(wordCoord["dotSize"], reverse=True)[topWordPlot_safe]
         wordCoord["labelToPlot"] = np.where(wordCoord["dotSize"] >= thres, wordCoord["label"], "")
 
         # Avoid label overlapping
@@ -950,7 +951,7 @@ def factorial(X, method, n_clusters=5, k_max=5):
         # Crea la lista `coord`
         coord_df = pd.DataFrame({
             "Dim1": cpc[:, 0],
-            "Dim2": cpc[:, 1],
+            "Dim2": cpc[:, 1] if cpc.shape[1] > 1 else np.zeros(len(cpc)),
             "label": levelnames
         })
         mask = coord_df["label"].str[-2:] == "_1"
diff --git a/functions/get_factorialanalysis.py.bak b/functions/get_factorialanalysis.py.bak
new file mode 100644
index 000000000..4d299dcf8
--- /dev/null
+++ b/functions/get_factorialanalysis.py.bak
@@ -0,0 +1,1180 @@
+from www.services import *
+from scipy.spatial import ConvexHull, QhullError
+
+def distance_to_y(dist, max_dist, scale_factor):
+    norm = math.log1p(dist) / math.log1p(max_dist)
+    return -norm * scale_factor
+
+def get_leaf_clusters(node, label_to_new_index, labels_lower, node_to_cluster):
+    if node.is_leaf():
+        label = labels_lower[node.id]
+        return {node_to_cluster[label_to_new_index[label]]}
+    left_clusters = get_leaf_clusters(node.left, label_to_new_index, labels_lower, node_to_cluster)
+    right_clusters = get_leaf_clusters(node.right, label_to_new_index, labels_lower, node_to_cluster)
+    return left_clusters.union(right_clusters)
+
+def _to_seq(val) -> List[str]:
+    """Flatten *val* to a list of strings, dropping NaN/None."""
+    if val is None or (isinstance(val, float) and pd.isna(val)):
+        return []
+    if isinstance(val, (list, tuple, set, np.ndarray)):
+        seq: Sequence = val  # type: ignore
+    else:
+        seq = [val]
+    out: List[str] = []
+    for x in seq:
+        if x is None or (isinstance(x, float) and pd.isna(x)):
+            continue
+        out.append(str(x))
+    return out
+
+def assign_consistent_colors(clusters):
+    palette = px.colors.qualitative.Plotly
+    unique_clusters = sorted(set(clusters.dropna()))
+    color_map = {cluster: palette[i % len(palette)] for i, cluster in enumerate(unique_clusters)}
+    color_map[np.nan] = "#CCCCCC"  # fallback per cluster NaN
+    return color_map
+
+
+def get_factorial_analysis(
+    df: pd.DataFrame,
+    ngram: Union[int, str] = 1,  
+    field: str = "ID",
+    terms_data_wm: Optional[Sequence[str]] = None,
+    synonyms_data_wm: Optional[Dict[str, str]] = None, 
+    n_terms: int = 50,
+    n_clusters: int = 5,
+    num_documents: Optional[int] = None,
+    method: str = "MCA",
+    dimX: int = 1,
+    dimY: int = 2,
+    topWordPlot: Union[int, float] = np.inf,
+    threshold: float = 0.10,
+    labelsize: int = 16,
+    size: int = 5,
+):
+    """Generate a 2‑D interactive *word map* for bibliometric data."""    
+    # Load terms to remove
+    remove_term = None
+    if terms_data_wm:
+        with open(terms_data_wm[0]['datapath'], 'r', encoding='utf-8') as file:
+            remove_term = [line.strip() for line in file]
+
+    # Load synonyms  
+    synonym = None
+    if synonyms_data_wm:
+        with open(synonyms_data_wm[0]['datapath'], 'r', encoding='utf-8') as file:
+            synonym = {}
+            for line in file:
+                terms = [term.strip() for term in line.split(',')]
+                key = terms[0] 
+                values = terms[1:]
+                synonym[key] = values
+
+    # Set ngrams based on word_type
+    ngrams = int(ngram) if field in ['TI', 'AB'] else 1
+
+    M = df
+    tab = table_tag(M, field, ngrams)
+    
+    if len(tab) >= 2:
+        # Get minimum degree threshold from the nth term
+        min_degree = list(tab.values())[min(n_terms, len(tab)-1)]
+
+        CS = conceptual_structure(
+            df=df,
+            method=method,
+            field=field,
+            min_degree=min_degree,
+            n_clusters=n_clusters,
+            k_max=8,
+            stemming=False,
+            labelsize=int(labelsize/2),
+            documents=num_documents,
+            graph=False,
+            ngrams=ngrams,
+            remove_terms=remove_term,
+            synonyms=synonym
+        )
+
+        if method != "MDS":
+            CSData = CS["docCoord"].copy()
+            CSData = CSData.reset_index().rename(columns={"index": "Documents"})
+            CSData["dim1"] = CSData["dim1"].round(2)
+            CSData["dim2"] = CSData["dim2"].round(2)
+            CSData["contrib"] = CSData["contrib"].round(2)
+            CS["CSData"] = CSData
+        else:
+            CS["CSData"] = pd.DataFrame({"Documents": [None], "dim1": [None], "dim2": [None]})
+
+        if method in {"CA", "MCA"}:
+            WData = pd.DataFrame(CS["km_res"]["data"], columns=["Dim1", "Dim2"])
+            WData["word"] = CS["km_res"]["data"].index
+            WData["cluster"] = CS["km_res"]["data"]["cluster"]
+        elif method == "MDS":
+            WData = pd.DataFrame(CS["res"], columns=["Dim1", "Dim2"])
+            WData["word"] = CS["res"].index
+            WData["cluster"] = CS["km_res"]["cluster"]
+
+        WData = WData.round({"Dim1": 2, "Dim2": 2})
+        CS["WData"] = WData
+
+        LABEL = WData["word"]
+
+        if method in {"CA", "MCA"}:
+            WData = CS["km_res"]["data"].copy()
+            WData = WData.reset_index().rename(columns={"index": "word"})
+            if "cluster" not in WData.columns and "cluster" in CS["km_res"]:
+                WData["cluster"] = CS["km_res"]["cluster"]
+            elif "cluster" not in WData.columns:
+                WData["cluster"] = np.nan
+            wordCoord = WData[["Dim1", "Dim2", "word", "cluster"]].copy()
+            wordCoord.rename(columns={"word": "label", "cluster": "groups"}, inplace=True)
+            contrib = CS["coord"]["contrib"].sum(axis=1) / 2
+            wordCoord["label"] = wordCoord["label"].values
+            wordCoord["contrib"] = np.array(contrib).flatten()
+
+            # Verifica che eigCorr esista prima di accedere
+            if CS["res"] is not None and hasattr(CS["res"], "eigCorr"):
+                xlabel = f"Dim 1 ({CS["res"].eigCorr["perc"].iloc[dimX-1] if len(CS["res"].eigCorr["perc"]) > dimX-1 else 0:.2f}%)"
+                ylabel = f"Dim 2 ({CS['res'].eigCorr['perc'].iloc[dimY-1] if len(CS['res'].eigCorr['perc']) > dimY-1 else 0:.2f}%)"
+            else:
+                xlabel, ylabel = "Dim 1", "Dim 2"
+
+        elif method == "MDS":
+            wordCoord = WData[["Dim1", "Dim2", "word", "cluster"]].copy()
+            wordCoord.rename(columns={"word": "label", "cluster": "groups"}, inplace=True)
+            wordCoord.rename(columns={"word": "label", "cluster": "groups"}, inplace=True)
+            wordCoord["contrib"] = size / 2  # MDS non ha contribuzioni vere
+            xlabel, ylabel = "Dim 1", "Dim 2"
+
+
+        ymax = wordCoord["Dim2"].max() - wordCoord["Dim2"].min()
+        xmax = wordCoord["Dim1"].max() - wordCoord["Dim1"].min()
+        threshold2 = threshold * np.mean([xmax, ymax])
+
+        wordCoord["dotSize"] = wordCoord["contrib"] + size
+        wordCoord["dotSize"] = wordCoord["dotSize"].replace([np.inf, -np.inf], np.nan)
+        wordCoord["dotSize"] = wordCoord["dotSize"].fillna(1)
+        wordCoord["dotSize"] = wordCoord["dotSize"].clip(lower=1)
+        topWordPlot_safe = min(int(topWordPlot) if np.isfinite(topWordPlot) else len(wordCoord), len(wordCoord) - 1)
+        thres = sorted(wordCoord["dotSize"], reverse=True)[topWordPlot_safe]
+        wordCoord["labelToPlot"] = np.where(wordCoord["dotSize"] >= thres, wordCoord["label"], "")
+
+        # Avoid label overlapping
+        # Placeholder for avoidOverlaps logic
+        # labelToRemove = avoidOverlaps(wordCoord, threshold=threshold2, dimX=dimX, dimY=dimY)
+        # wordCoord["labelToPlot"] = np.where(wordCoord["labelToPlot"].isin(labelToRemove), "", wordCoord["labelToPlot"])
+        # wordCoord["label"] = wordCoord["label"].str.replace("_1", "", regex=False)
+        # wordCoord["labelToPlot"] = wordCoord["labelToPlot"].str.replace("_1", "", regex=False)
+
+
+        ####################################### WORD MAP #######################################
+        # Palette cluster
+        group_colors = assign_consistent_colors(wordCoord["groups"])
+
+        # Hover arricchito
+        hoverText = [
+            f"<b>{row['label']}</b><br>Cluster: {row['groups'] if 'groups' in row else ''}<br>Contrib: {row['contrib']:.3f}"
+            for _, row in wordCoord.iterrows()
+        ]
+
+        fig = go.Figure()
+
+        # Marker colorati per cluster, trasparenti, bordo sottile
+        for g in sorted(wordCoord["groups"].dropna().unique()):
+            group_df = wordCoord[wordCoord["groups"] == g]
+            fig.add_trace(
+            go.Scatter(
+                x=group_df["Dim1"],
+                y=group_df["Dim2"],
+                mode="markers",
+                marker=dict(
+                size=group_df["dotSize"],
+                color=group_colors.get(g, "#FF0000"),  # fallback colore
+                opacity=0.7,
+                line=dict(width=0.7, color="black"),
+                symbol="circle",
+                ),
+                opacity=0.7,
+                text=group_df["label"],
+                hovertext=[
+                f"<b>{row['label']}</b><br>Cluster: {row['groups']}<br>Contrib: {row['contrib']:.3f}"
+                for _, row in group_df.iterrows()
+                ],
+                hoverinfo="text",
+                name=f"Cluster {g}",
+                showlegend=False,
+            )
+            )
+
+        # Aggiungi i NaN separatamente (se esistono)
+        group_df_nan = wordCoord[wordCoord["groups"].isna()]
+        if not group_df_nan.empty:
+            fig.add_trace(
+            go.Scatter(
+                x=group_df_nan["Dim1"],
+                y=group_df_nan["Dim2"],
+                mode="markers",
+                marker=dict(
+                size=group_df_nan["dotSize"],
+                color="#FF9999",
+                opacity=0.7,
+                line=dict(width=0.7, color="black"),
+                symbol="circle",
+                ),
+                opacity=0.7,
+                text=group_df_nan["label"],
+                hovertext=[
+                f"<b>{row['label']}</b><br>Cluster: N/A<br>Contrib: {row['contrib']:.3f}"
+                for _, row in group_df_nan.iterrows()
+                ],
+                hoverinfo="text",
+                name="No Cluster",
+                showlegend=False,
+            )
+            )
+
+        # Aggiungi contorni dei cluster (Convex Hull)
+        if n_clusters != 1 and "hull_data" in CS and CS["hull_data"] is not None and not CS["hull_data"].empty:
+            hull_data = CS["hull_data"]
+            for cluster_id in hull_data["cluster"].unique():
+                group = hull_data[hull_data["cluster"] == cluster_id]
+                fig.add_trace(
+                    go.Scatter(
+                    x=group["Dim1"],
+                    y=group["Dim2"],
+                    mode="lines",
+                    line=dict(color=group_colors.get(cluster_id, "gray"), width=2),
+                    fill="toself",
+                    opacity=0.15,
+                    hoverinfo="skip",
+                    showlegend=False
+                    )
+                )
+
+        # Etichette solo per i top word (labelToPlot), spostate più in alto rispetto ai pallini
+        # Offset dinamico in base alla dimensione verticale del grafico
+        label_offset = 0.03 * (wordCoord["Dim2"].max() - wordCoord["Dim2"].min())
+
+        for _, row in wordCoord[wordCoord["labelToPlot"] != ""].iterrows():
+            fig.add_annotation(
+            x=row["Dim1"],
+            y=row["Dim2"] + label_offset,
+            text=row["labelToPlot"],
+            font=dict(size=labelsize, color=group_colors.get(row["groups"], "black")),
+            showarrow=False,
+            )
+
+        # Assi X=0 e Y=0, grigi e tratteggiati
+        fig.add_shape(
+            type="line",
+            x0=wordCoord["Dim1"].min(),
+            x1=wordCoord["Dim1"].max(),
+            y0=0,
+            y1=0,
+            line=dict(color="#B0B0B0", width=1.5, dash="dash"),
+            layer="below"
+        )
+        fig.add_shape(
+            type="line",
+            x0=0,
+            x1=0,
+            y0=wordCoord["Dim2"].min(),
+            y1=wordCoord["Dim2"].max(),
+            line=dict(color="#B0B0B0", width=1.5, dash="dash"),
+            layer="below"
+        )
+
+        # Personalizza l'hovertemplate per renderlo leggibile e carino
+        for trace in fig.data:
+            trace.hovertemplate = (
+            "<b>%{text}</b><br>"
+            "Cluster: %{marker.color}<br>"
+            "Contribuzione: %{marker.size:.2f}<extra></extra>"
+            )
+
+        fig.update_layout(
+            xaxis=dict(
+            title=xlabel,
+            zeroline=True,
+            zerolinewidth=1.5,
+            zerolinecolor="#B0B0B0",
+            showgrid=True,
+            gridcolor="lightgray",
+            showline=False,
+            showticklabels=True
+            ),
+            yaxis=dict(
+            title=ylabel,
+            zeroline=True,
+            zerolinewidth=1.5,
+            zerolinecolor="#B0B0B0",
+            showgrid=True,
+            gridcolor="lightgray",
+            showline=False,
+            showticklabels=True
+            ),
+            plot_bgcolor="rgba(0,0,0,0)",
+            paper_bgcolor="rgba(0,0,0,0)",
+            showlegend=False,
+            height=800,
+            hoverlabel=dict(
+            bgcolor="white",
+            font_size=13,
+            font_family="Segoe UI, Arial",
+            bordercolor="#5567BB"
+            ),
+        )
+        fig = go.FigureWidget(fig)
+        fig._config = fig._config | {'modeBarButtonsToRemove': ['pan', 'select', 'lasso2d', 'toImage'],
+                                     'displaylogo': False}
+
+        #####################################################################################
+
+        ################################### DENDROGRAM COERENTE CON WORD MAP ###################################
+        import networkx as nx
+        from pyvis.network import Network
+        from scipy.cluster.hierarchy import linkage, to_tree
+        from pathlib import Path
+        from scipy.cluster.hierarchy import optimal_leaf_ordering
+        from scipy.spatial.distance import pdist
+        import math
+        import tempfile
+        import os
+
+        # 1. Linkage, labels, cluster mapping
+        labels_lower = CS["km_res"]["data"].index.str.lower().tolist()
+        coords = CS["km_res"]["data"][["Dim1", "Dim2"]].values
+        linkage_matrix = CS["linkage"]
+
+        word_to_cluster = dict(zip(WData["word"], WData["cluster"]))
+        group_colors = assign_consistent_colors(WData["cluster"])
+        leaf_offset = len(labels_lower)
+
+        # 2. Ordina le parole secondo dendrogramma
+        ddata = dendrogram(linkage_matrix, labels=labels_lower, no_plot=True)
+        words_sorted = ddata["ivl"]
+        n_terms = len(words_sorted)
+        scale_factor = int(500 * math.log2(n_terms + 1))  # log-scale vertical height
+
+        # 3. Inizializza rete Pyvis
+        tree, nodes = to_tree(linkage_matrix, rd=True)
+        net = Network(height="98vh", width="100%", directed=True, notebook=True, cdn_resources="in_line")
+        net.toggle_physics(False)
+        positions = {}
+        label_boxes = []
+        node_to_cluster = {}
+
+        leaf_x = 0
+        x_spacing = 100
+        label_to_new_index = {label: i for i, label in enumerate(words_sorted)}
+
+        # Per memorizzare cambi cluster
+        cut_lines = {}
+
+        # FOGUE
+        for i, label in enumerate(words_sorted):
+            node_id = i
+            x = leaf_x
+            y = 0
+            cluster = word_to_cluster.get(label.lower(), -1)
+            color = group_colors.get(cluster, "#999999")
+            node_to_cluster[node_id] = cluster
+            positions[node_id] = (x, y)
+
+            # Nodo foglia
+            net.add_node(
+                node_id,
+                label=" ",
+                color=color,
+                shape="dot",
+                size=6,
+                title=label,
+                font={"size": 18, "face": "arial"},
+                physics=False,
+                x=x,
+                y=y + 40
+            )
+
+            # Nodo stub
+            stub_y = y - 20
+            stub_id = f"stub_{node_id}"
+            positions[stub_id] = (x, stub_y)
+            net.add_node(
+                stub_id,
+                label=" ",
+                title=" ",
+                color="#00000000",
+                shape="dot",
+                size=1,
+                physics=False,
+                x=x,
+                y=stub_y,
+                font={"color": "#00000000", "size": 1}
+            )
+
+            net.add_edge(
+                stub_id,
+                node_id,
+                label=" ",
+                color=color,
+                width=10,
+                smooth=False,
+                physics=False,
+                arrows=""
+            )
+
+            # Label HTML dinamica
+            box_html = f"""
+            <div id="label-{node_id}" class="floating-label" style="background-color: {color};">
+            {label.upper()}
+            </div>
+            """
+            label_boxes.append(box_html)
+            leaf_x += x_spacing
+
+        # MERGE
+        def add_internal_nodes(node):
+            if node.is_leaf():
+                label = labels_lower[node.id]
+                new_id = label_to_new_index[label]
+                stub_id = f"stub_{new_id}"
+                return positions[stub_id], stub_id
+
+            # 1. Ricorsione sui figli
+            left_pos, left_stub_id = add_internal_nodes(node.left)
+            right_pos, right_stub_id = add_internal_nodes(node.right)
+
+            # 2. Coordinate del nodo interno
+            x_center = (left_pos[0] + right_pos[0]) / 2
+            y = min(left_pos[1], right_pos[1])
+            max_dist = linkage_matrix[:, 2].max()
+            stub_y = distance_to_y(node.dist, max_dist, scale_factor)
+
+
+            node_id = node.id + leaf_offset
+            stub_id = f"stub_{node_id}"
+            positions[node_id] = (x_center, y)
+            positions[stub_id] = (x_center, stub_y)
+            total = node.count
+
+            # 3. Colore cluster (ereditato dal figlio sinistro)
+            left_cluster = node_to_cluster.get(
+                node.left.id + leaf_offset if not node.left.is_leaf() else label_to_new_index[labels_lower[node.left.id]],
+                -1
+            )
+            right_cluster = node_to_cluster.get(
+                node.right.id + leaf_offset if not node.right.is_leaf() else label_to_new_index[labels_lower[node.right.id]],
+                -1
+            )
+
+            cluster = left_cluster
+            node_to_cluster[node_id] = cluster
+            color = group_colors.get(cluster, "#999999")
+
+            # 4. Nodo interno
+            net.add_node(
+                node_id,
+                label=" ",
+                shape="dot",
+                size=20,
+                physics=False,
+                x=x_center,
+                y=y,
+                title=f"Distance: {node.dist:.2f} Words: {total}",
+                color={
+                    "background": "#FFFFFF",   # Riempimento bianco
+                    "border": "#3399FF",       # Bordo blu tenue
+                    "highlight": "#000000"     # Colore al passaggio mouse (opzionale)
+                },
+                borderWidth=2,
+            )
+
+
+            # 5. Nodo stub sopra
+            net.add_node(
+                stub_id,
+                label=" ",
+                title=f"Distance: {node.dist:.2f} Words: {total}",
+                color="#00000000",
+                shape="dot",
+                size=4,
+                physics=False,
+                x=x_center,
+                y=stub_y,
+                font={"color": "#00000000", "size": 1}
+            )
+
+            # 6. Edge verticale (stub → nodo)
+            if node != tree:
+                net.add_edge(
+                    stub_id,
+                    node_id,
+                    label=" ",
+                    title=f"Distance: {node.dist:.2f} Words: {node.count}",
+                    color=color,
+                    width=10,
+                    smooth=False,
+                    physics=False,
+                    arrows=""
+                )
+
+            # 7. Collega i due figli
+            for child_stub_id in [left_stub_id, right_stub_id]:
+                child_x, child_y = positions[child_stub_id]
+                inter_id = f"{node_id}_{child_stub_id}_v"
+                inter_y = y
+
+                net.add_node(
+                    inter_id,
+                    label=" ",
+                    title=" ",
+                    color="#00000000",
+                    shape="dot",
+                    size=1,
+                    physics=False,
+                    x=child_x,
+                    y=inter_y
+                )
+
+                # print(f"[HLINE] Nodo {node_id} connesso a {child_stub_id} a y={inter_y:.2f}")
+
+                net.add_edge(
+                    node_id,
+                    inter_id,
+                    color=color,
+                    title=f"Distance: {node.dist:.2f} Words: {node.count}",
+                    width=10,
+                    smooth=False,
+                    physics=False,
+                    arrows=""
+                )
+                net.add_edge(
+                    inter_id,
+                    child_stub_id,
+                    color=color,
+                    title=f"Distance: {node.dist:.2f} Words: {node.count}",
+                    width=10,
+                    smooth=False,
+                    physics=False,
+                    arrows=""
+                )
+
+            # 8. Linea di taglio (se cambia cluster)
+            left_leaf_clusters = get_leaf_clusters(node.left, label_to_new_index, labels_lower, node_to_cluster)
+            right_leaf_clusters = get_leaf_clusters(node.right, label_to_new_index, labels_lower, node_to_cluster)
+
+            if left_leaf_clusters.isdisjoint(right_leaf_clusters):
+                cl1 = min(left_leaf_clusters)
+                cl2 = min(right_leaf_clusters)
+                cluster_pair = tuple(sorted((cl1, cl2)))
+                if cluster_pair not in cut_lines:
+                    cut_lines[cluster_pair] = y  # posizione reale della fusione visibile
+                    # print(f"[CUT LINE] Cambio cluster {cluster_pair} a y = {stub_y:.2f}")
+
+
+            return (x_center, stub_y), stub_id
+
+        # Costruisci
+        _, root_stub_id = add_internal_nodes(tree)
+
+        # Aggiungi linee rosse di taglio
+        # Aggiungi solo la linea di taglio più bassa (cioè y più vicino allo 0)
+        if cut_lines:
+            # Trova la coppia con il max y (cioè la linea di taglio più bassa visivamente)
+            (cl1, cl2), y = max(cut_lines.items(), key=lambda x: x[1])
+
+            net.add_node(
+                f"cut_{cl1}_{cl2}_left", x=0, y=y, label="", shape="dot", size=0.1, color="#FF0000", physics=False
+            )
+            net.add_node(
+                f"cut_{cl1}_{cl2}_right", x=(leaf_x - x_spacing), y=y, label="", shape="dot", size=0.1, color="#FF0000", physics=False
+            )
+            net.add_edge(
+                f"cut_{cl1}_{cl2}_left",
+                f"cut_{cl1}_{cl2}_right",
+                label=f"cut @ y={y:.1f}",
+                color="#FF0000",
+                width=20,
+                physics=False,
+                arrows=""
+            )
+
+        # 1. Salva grafo base in HTML
+        html = net.generate_html()
+
+        # 2. Inietta etichette HTML
+        injection = f"""
+        <style>
+        .floating-label {{
+            position: absolute;
+            writing-mode: vertical-rl;
+            transform: rotate(180deg);
+            font-size: 14px;
+            border: 1px solid #999;
+            padding: 2px;
+            text-align: center;
+            line-height: 1.1;
+            z-index: 999;
+            pointer-events: none;
+        }}
+        </style>
+        {''.join(label_boxes)}
+        <script>
+        function updateLabels() {{
+            var canvas = document.getElementsByTagName("canvas")[0];
+            var rect = canvas.getBoundingClientRect();
+            var pos = network.getPositions();
+            for (var id in pos) {{
+                var domPos = network.canvasToDOM(pos[id]);
+                var el = document.getElementById("label-" + id);
+                if (el) {{
+                    el.style.left = (rect.left + domPos.x + window.scrollX -5) + "px";
+                    el.style.top = (rect.top + domPos.y + window.scrollY + 10) + "px";
+                }}
+            }}
+        }}
+        network.on("afterDrawing", updateLabels);
+        window.addEventListener("resize", updateLabels);
+        </script>
+        """
+
+        html = html.replace("</body>", injection + "\n</body>")
+
+        # 3. Salvataggio file
+        tmp = tempfile.NamedTemporaryFile(delete=False, suffix=".html")
+        html_path = tmp.name
+        with open(html_path, 'w', encoding="utf-8") as f:
+            new_css = "     .card {\n                 border: none;\n             }"
+            updated_html = html.replace("</style>", new_css + "\n        </style>")
+            updated_html = updated_html.replace("1px solid lightgray", "none")
+            
+            f.write(updated_html)
+
+        ############################################
+        words_by_cluster = WData[["word", "Dim1", "Dim2", "cluster"]].copy()
+
+        # 5. Restituisci
+        return fig, html_path.split(os.sep)[-1], words_by_cluster, CS["CSData"]
+
+
+def conceptual_structure(
+    df: pd.DataFrame,
+    field: str = "ID",
+    ngrams: int = 1,
+    method: str = "MCA",
+    min_degree: int = 2,
+    n_clusters: Union[str, int] = "auto",
+    k_max: int = 5,
+    stemming: bool = False,
+    labelsize: int = 10,
+    documents: int = 2,
+    graph: bool = True,
+    remove_terms: Optional[Sequence[str]] = None,
+    synonyms: Optional[Dict[str, str]] = None
+) -> Dict:
+    # Set binary flag based on method
+    binary = method == "MCA"
+    
+    # Create co-occurrence matrix based on field
+    if field == "ID":
+        CW = cocMatrix(df, Field="ID", binary=binary, remove_terms=remove_terms, synonyms=synonyms)
+        CW = CW.loc[:, CW.sum() >= min_degree]
+        CW = CW.loc[CW.sum(axis=1) > 0]
+        CW = CW.loc[:, ~CW.columns.isin(["NA"])]
+
+    elif field == "DE":
+        CW = cocMatrix(df, Field="DE", binary=binary, remove_terms=remove_terms, synonyms=synonyms)
+        CW = CW.loc[:, CW.sum() >= min_degree]
+        CW = CW.loc[CW.sum(axis=1) > 0]
+        CW = CW.loc[:, ~CW.columns.isin(["NA"])]
+
+    elif field == "ID_TM":
+        df = term_extraction(df, field="ID", stemming=stemming, remove_terms=remove_terms, synonyms=synonyms, ngrams=ngrams)
+        CW = cocMatrix(df, Field="ID_TM", binary=binary)
+        CW = CW.loc[:, CW.sum() >= min_degree]
+        CW = CW.loc[CW.sum(axis=1) > 0]
+        CW = CW.loc[:, ~CW.columns.isin(["NA"])]
+
+    elif field == "DE_TM":
+        df = term_extraction(df, field="DE", stemming=stemming, remove_terms=remove_terms, synonyms=synonyms, ngrams=ngrams)
+        CW = cocMatrix(df, Field="DE_TM", binary=binary)
+        CW = CW.loc[:, CW.sum() >= min_degree]
+        CW = CW.loc[CW.sum(axis=1) > 0]
+        CW = CW.loc[:, ~CW.columns.isin(["NA"])]
+
+    elif field == "TI":
+        df = term_extraction(df, field="TI", stemming=stemming, remove_terms=remove_terms, synonyms=synonyms, ngrams=ngrams)
+        CW = cocMatrix(df, Field="TI_TM", binary=binary)
+        CW = CW.loc[:, CW.sum() >= min_degree]
+        CW = CW.loc[CW.sum(axis=1) > 0]
+        CW = CW.loc[:, ~CW.columns.isin(["NA"])]
+
+    elif field == "AB":
+        df = term_extraction(df, field="AB", stemming=stemming, remove_terms=remove_terms, synonyms=synonyms, ngrams=ngrams)
+        CW = cocMatrix(df, Field="AB_TM", binary=binary)
+        CW = CW.loc[:, CW.sum() >= min_degree]
+        CW = CW.loc[CW.sum(axis=1) > 0]
+        CW = CW.loc[:, ~CW.columns.isin(["NA"])]
+
+    # Convert labels to lowercase
+    CW.columns = CW.columns.str.lower()
+    CW.index = CW.index.str.lower()
+
+    # print("CW", CW)
+    
+    # Run factorial analysis
+    results = factorial(CW, method=method, n_clusters=n_clusters, k_max=k_max)
+    res_mca = results['res_mca'] if 'res_mca' in results else None
+
+    if res_mca is not None:
+        doc_coord = results['docCoord']
+    else:
+        doc_coord = None
+
+    df = results.get('df', results.get('res'))
+
+    df.index = CW.columns
+    doc_coord = results['docCoord']
+
+    # Add total citations if available
+    # Add total citations if available and method is not "MDS"
+    if "TC" in df.columns and method != "MDS":
+        # Try to match doc_coord index to df index (case-insensitive)
+        doc_coord = doc_coord.copy()
+        doc_coord_index_upper = doc_coord.index.astype(str).str.upper()
+        df_index_upper = df.index.astype(str).str.upper()
+        tc_map = dict(zip(df_index_upper, df["TC"].astype(float)))
+        doc_coord["TC"] = doc_coord_index_upper.map(tc_map)
+
+    # Perform hierarchical clustering
+    # km_res vis_hclust pyvis
+    km_res = linkage(pdist(df, metric='euclidean'), method='average')
+    results['linkage'] = km_res
+
+    # Determine the number of clusters
+    if n_clusters == "auto":
+        heights = np.diff(km_res[:, 2])
+        n_clusters = min(len(heights) - np.argmax(heights) + 1, k_max)
+    else:
+        n_clusters = max(1, min(int(n_clusters), k_max))
+
+    # Assign clusters to data points
+    cluster_labels = fcluster(km_res, n_clusters, criterion='maxclust')
+    df = df.copy()
+    df['cluster'] = cluster_labels
+
+    # Create data.clust (dataframe with data and cluster)
+    data_clust = df.copy()
+
+    # Calculate cluster centers
+    centers = data_clust.groupby('cluster').agg({
+        'Dim1': 'mean',
+        'Dim2': 'mean'
+    }).reset_index()
+
+    # Reorder columns to match R: Dim1, Dim2, cluster
+    centers = centers[['Dim1', 'Dim2', 'cluster']]
+
+    # Add shape and label columns
+    data_clust['shape'] = "1"
+    data_clust['label'] = data_clust.index.astype(str)
+    centers['shape'] = "0"
+    centers['label'] = ""
+
+    # Concatenate data_clust and centers
+    df_clust = pd.concat([data_clust, centers], ignore_index=True, sort=False)
+
+    # Assign color by cluster (using Plotly palette)
+    colorlist = px.colors.qualitative.Plotly
+    df_clust['color'] = df_clust['cluster'].apply(lambda x: colorlist[int(x) % len(colorlist)] if pd.notnull(x) else "#CCCCCC")
+
+    # Create hull data for plotting (similar to R dplyr + chull logic)
+    hull_data_list = []
+    for cluster in df_clust['cluster'].dropna().unique():
+        group = df_clust[df_clust['cluster'] == cluster]
+        if len(group) >= 3:
+            try:
+                hull_idx = ConvexHull(group[['Dim1', 'Dim2']]).vertices
+                hull_points = group.iloc[hull_idx]
+                # Chiudi il poligono (aggiungi il primo punto alla fine)
+                hull_points = pd.concat([hull_points, hull_points.iloc[[0]]])
+            except QhullError as e:
+                # print(f"[WARN] ConvexHull fallito per cluster {cluster}: {e}")
+                # Fallback: rettangolo minimo
+                x_min, x_max = group["Dim1"].min(), group["Dim1"].max()
+                y_min, y_max = group["Dim2"].min(), group["Dim2"].max()
+                hull_points = pd.DataFrame({
+                    "Dim1": [x_min, x_max, x_max, x_min, x_min],
+                    "Dim2": [y_min, y_min, y_max, y_max, y_min],
+                    "cluster": cluster
+                })
+            hull_data_list.append(hull_points)
+
+    if hull_data_list:
+        hull_data = pd.concat(hull_data_list)
+        # For each cluster, add the first point again to close the polygon
+        hull_data = pd.concat([
+            hull_data,
+            hull_data.groupby('cluster').head(1)
+        ])
+        hull_data = hull_data.reset_index(drop=True)
+        hull_data['id'] = hull_data.groupby('cluster').cumcount() + 1
+        hull_data = hull_data.sort_values(['cluster', 'id'])
+    else:
+        hull_data = pd.DataFrame()
+
+    if doc_coord is not None:
+        results = {
+            'net': CW,
+            'res': res_mca,
+            'km_res': {'data': df, 'centers': centers},
+            'docCoord': doc_coord,
+            'coord': results['coord'] if 'coord' in results else None,
+            'hull_data': hull_data,
+            'linkage': km_res
+        }
+    else:
+        results = {
+            'net': CW,
+            'res': df,
+            'km_res': {
+                'data': df,
+                'centers': centers,
+                'cluster': df['cluster']
+            },
+            'docCoord': None,
+            'coord': None,
+            'hull_data': hull_data,
+            'linkage': km_res
+        }
+
+    params = {
+        'field': field,
+        'ngrams': ngrams,
+        'method': method,
+        'min_degree': min_degree,
+        'n_clusters': n_clusters,
+        'k_max': k_max,
+        'stemming': stemming,
+        'labelsize': labelsize,
+        'documents': documents,
+        'graph': graph,
+        'remove_terms': remove_terms,
+        'synonyms': synonyms
+    }
+    params_df = pd.DataFrame({
+        'params': list(params.keys()),
+        'values': [str(params[k]) for k in params]
+    })
+    results['params'] = params_df
+
+    return results
+
+
+def factorial(X, method, n_clusters=5, k_max=5):
+    """
+    Perform factorial analysis on the input data.
+
+    Args:
+        X: Input data (e.g., co-occurrence matrix).
+        method: Analysis method ("CA", "MCA", "MDS").
+
+    Returns:
+        A dictionary containing the results of the factorial analysis.
+    """
+    if method == "CA":
+        res_mca = CA(n_components=2).fit(X)
+
+        row_coords = res_mca.row_coordinates(X)
+        col_coords = res_mca.column_coordinates(X)
+
+        K = 2
+        I, J = row_coords.shape[0], col_coords.shape[0]
+
+        singular_values = np.linalg.norm(row_coords.values, axis=0)[:K]
+        evF = np.tile(singular_values, (I, 1))
+        evG = np.tile(singular_values, (J, 1))
+
+        rpc = row_coords.iloc[:, :K].values * evF
+        cpc = col_coords.iloc[:, :K].values * evG
+
+        column_masses = (X.sum(axis=0) / X.values.sum()).values
+        column_distances = np.sum(cpc**2, axis=1)
+
+        coord = {
+            "coord": pd.DataFrame(cpc[:, :2], columns=["Dim1", "Dim2"], index=col_coords.index),
+            "contrib": pd.DataFrame((cpc[:, :2] ** 2) * column_masses[:, None] / singular_values, columns=["Dim1", "Dim2"], index=col_coords.index),
+            "cos2": pd.DataFrame((cpc[:, :2] ** 2) / column_distances[:, None], columns=["Dim1", "Dim2"], index=col_coords.index)
+        }
+
+        coord_doc = {
+            "coord": pd.DataFrame(rpc[:, :2], columns=["Dim1", "Dim2"], index=row_coords.index),
+            "contrib": pd.DataFrame((rpc[:, :2] ** 2), columns=["Dim1", "Dim2"], index=row_coords.index),
+            "cos2": pd.DataFrame((rpc[:, :2] ** 2) / np.sum(rpc[:, :2] ** 2, axis=1)[:, None], columns=["Dim1", "Dim2"], index=row_coords.index)
+        }
+
+
+    elif method == "MCA":
+        
+        # Multiple Correspondence Analysis
+        X = X.apply(lambda col: col.astype("category"))
+        res_mca = MCA(n_components=2).fit(X)
+
+        # Estrai i nomi dei livelli (equivalente di `res.mca$levelnames` in R)
+        levelnames = [f"{col}_{val}" for col in X.columns for val in X[col].cat.categories]
+
+        K = 2
+        row_coords = res_mca.row_coordinates(X)
+        col_coords = res_mca.column_coordinates(X)
+        I, J = row_coords.shape[0], col_coords.shape[0]
+
+        # Stima dei valori singolari
+        # I valori singolari possono essere stimati come la norma delle prime componenti
+        singular_values = np.linalg.norm(row_coords.values, axis=0)[:2]
+
+        # Crea le matrici evF ed evG replicando i valori singolari
+        evF = np.tile(singular_values, (I, 1))  # Matrice di dimensione (I, K)
+        evG = np.tile(singular_values, (J, 1))  # Matrice di dimensione (J, K)
+
+        rpc = row_coords.iloc[:, :K].values * evF
+        cpc = col_coords.iloc[:, :K].values * evG
+
+        # Calcolo delle masse delle colonne
+        column_frequencies = X.apply(lambda col: col.value_counts(normalize=True)).fillna(0)
+        column_mass = column_frequencies.values.flatten()  # Vettore delle masse delle colonne
+
+        # Calcolo delle distanze delle colonne
+        column_distances = np.sum(cpc**2, axis=1)  # Calcola la somma dei quadrati delle coordinate
+
+        # Crea la lista `coord`
+        coord_df = pd.DataFrame({
+            "Dim1": cpc[:, 0],
+            "Dim2": cpc[:, 1],
+            "label": levelnames
+        })
+        mask = coord_df["label"].str[-2:] == "_1"
+        coord = {
+            "coord": coord_df[mask].drop(columns=["label"]).reset_index(drop=True),
+
+            "contrib": pd.DataFrame(
+            (cpc**2) * column_mass[:, np.newaxis] / singular_values,
+            columns=["Dim1", "Dim2"]
+            ).assign(label=levelnames)[mask].drop(columns=["label"]).reset_index(drop=True),
+
+            "cos2": pd.DataFrame(
+            (cpc**2) / column_distances[:, np.newaxis],  # Usa le distanze calcolate
+            columns=["Dim1", "Dim2"]
+            ).assign(label=levelnames)[mask].drop(columns=["label"]).reset_index(drop=True)
+        }
+
+        # Imposta i nomi delle righe
+        row_names = coord["coord"].index.astype(str).str[:-2]
+        coord["coord"].index = row_names
+        coord["contrib"].index = row_names
+        coord["cos2"].index = row_names
+
+        # Crea la lista `coord_doc`
+        coord_doc = {
+            "coord": pd.DataFrame({
+            "Dim1": rpc[:, 0],
+            "Dim2": rpc[:, 1]
+            }, index=X.index),
+
+            "contrib": pd.DataFrame(
+            (rpc[:, :2]**2) * res_mca.row_masses_.values[:, np.newaxis] / singular_values,
+            columns=["Dim1", "Dim2"]
+            ),
+
+            "cos2": pd.DataFrame(
+            res_mca.row_masses_.values[:, np.newaxis] * rpc**2 / res_mca.total_inertia_,
+            columns=["Dim1", "Dim2"]
+            )
+        }
+
+    elif method == "MDS":
+    # Step 1: NetMatrix = X.T @ X
+        net_matrix = X.T @ X
+
+        # Step 2: Association-based normalization
+        net_matrix_np = net_matrix.to_numpy()
+        row_sums = net_matrix_np.sum(axis=1, keepdims=True)
+        col_sums = net_matrix_np.sum(axis=0, keepdims=True)
+        expected = row_sums @ col_sums / net_matrix_np.sum()
+        norm_matrix = np.divide(net_matrix_np, expected, where=expected != 0)
+        norm_matrix = np.nan_to_num(norm_matrix, nan=0.0, posinf=0.0, neginf=0.0)
+
+        # Step 3: Dissimilarity matrix
+        dissim_matrix = 1 - norm_matrix
+        np.fill_diagonal(dissim_matrix, 0)
+
+        # Step 4: MDS (classical)
+        mds = SK_MDS(n_components=2, dissimilarity="precomputed", random_state=42)
+        coords = mds.fit_transform(dissim_matrix)
+
+        # Normalizza le coordinate (StandardScaler per coerenza visiva)
+        coords = StandardScaler().fit_transform(coords)
+
+        # Crea DataFrame delle coordinate
+        df = pd.DataFrame(coords, columns=["Dim1", "Dim2"], index=X.columns)
+
+        # Clustering sulle coordinate
+        km_res = linkage(pdist(df), method='average')
+
+        if n_clusters == "auto":
+            heights = np.diff(km_res[:, 2])
+            n_clusters = min(len(heights) - np.argmax(heights) + 1, k_max)
+        else:
+            n_clusters = max(1, min(int(n_clusters), k_max))
+
+        cluster_labels = fcluster(km_res, n_clusters, criterion='maxclust')
+        df["cluster"] = cluster_labels
+
+        # Calcolo contribuzione proxy: distanza dal centroide
+        centroids = df.groupby("cluster")[["Dim1", "Dim2"]].transform("mean")
+        df["contrib"] = np.sqrt((df["Dim1"] - centroids["Dim1"])**2 + (df["Dim2"] - centroids["Dim2"])**2)
+        df["contrib"] = (df["contrib"] - df["contrib"].min()) / (df["contrib"].max() - df["contrib"].min()) + 1
+
+        # Autovalori fittizi per etichette (Benzecri style)
+        sv = np.linalg.norm(coords, axis=0)
+        eig_benz = np.where(sv**2 > 1 / len(sv),
+                            ((len(sv) / (len(sv) - 1)) ** 2) * (sv**2 - 1 / len(sv))**2,
+                            0)
+        perc = eig_benz / eig_benz.sum() * 100 if eig_benz.sum() > 0 else np.zeros_like(eig_benz)
+        cum_perc = np.cumsum(perc)
+        eig_corr = pd.DataFrame({
+            "eig": sv**2,
+            "eigBenz": eig_benz,
+            "perc": perc,
+            "cumPerc": cum_perc
+        })
+
+        results = {
+            "res_mca": {"eigCorr": eig_corr, "sv": sv},
+            "df": df,
+            "df_doc": None,
+            "docCoord": None,
+            "coord": None
+        }
+
+        return results
+
+
+    else:
+        raise ValueError(f"Unsupported method: {method}")
+
+    # Blocchi comuni per CA/MCA (non MDS)
+    if method != "MDS":
+        res_mca = eig_correction(res_mca, singular_values)
+
+        docCoord = pd.DataFrame(
+            np.hstack([coord_doc["coord"], coord_doc["contrib"].sum(axis=1).to_numpy()[:, None]]),
+            columns=["dim1", "dim2", "contrib"],
+        ).sort_values(by="contrib", ascending=False)
+
+        res_mca.coord_doc = coord_doc
+
+        results = {
+            "res_mca": res_mca,
+            "df": coord["coord"],
+            "df_doc": coord_doc["coord"],
+            "docCoord": docCoord,
+            "coord": coord,
+        }
+
+    return results
+
+
+def eig_correction(res_mca, singular_values):
+    """
+    Apply Benzecri eigenvalue correction to the results of factorial analysis.
+
+    Args:
+        res_mca: Results of factorial analysis.
+        singular_values: Array or list of singular values from the analysis.
+
+    Returns:
+        Corrected results.
+    """
+    n = len(singular_values)
+    e = np.array(singular_values) ** 2
+    eig_benz = np.where(
+        e > 1 / n,
+        ((n / (n - 1)) ** 2) * (e - (1 / n)) ** 2,
+        0
+    )
+    perc = eig_benz / np.sum(eig_benz) * 100 if np.sum(eig_benz) > 0 else np.zeros_like(eig_benz)
+    cum_perc = np.cumsum(perc)
+
+    eig_corr = pd.DataFrame({
+        "eig": e,
+        "eigBenz": eig_benz,
+        "perc": perc,
+        "cumPerc": cum_perc
+    })
+
+    # Attach eigCorr as attribute or dict entry
+    if hasattr(res_mca, '__dict__'):
+        res_mca.eigCorr = eig_corr
+    else:
+        res_mca['eigCorr'] = eig_corr
+    return res_mca
+
+
+def avoidOverlaps(df, threshold=0.10, dimX=0, dimY=1):
+    """
+    Avoid overlapping labels in a scatter plot.
+
+    Args:
+        df: DataFrame containing the coordinates and labels.
+        threshold: Distance threshold for avoiding overlaps.
+        dimX: Index of the x-coordinate column.
+        dimY: Index of the y-coordinate column.
+
+    Returns:
+        List of labels to remove to avoid overlaps.
+    """
+    df["Dim2"] = df["Dim2"] / 3
+
+    # Filter rows with non-empty labels
+    filtered_df = df[df["labelToPlot"] != ""].copy()
+
+    # Compute Manhattan distances
+    distances = pd.DataFrame(
+        pdist(filtered_df[["Dim1", "Dim2"]], metric="cityblock"),
+        columns=["dist"]
+    )
+    distances["from"] = np.repeat(filtered_df["labelToPlot"].values, len(filtered_df))
+    distances["to"] = np.tile(filtered_df["labelToPlot"].values, len(filtered_df))
+    distances = distances[distances["from"] != distances["to"]]
+
+    # Add dot sizes
+    distances = distances.merge(
+        filtered_df[["labelToPlot", "dotSize"]].rename(columns={"dotSize": "w_from"}),
+        left_on="from",
+        right_on="labelToPlot"
+    ).drop(columns=["labelToPlot"])
+    distances = distances.merge(
+        filtered_df[["labelToPlot", "dotSize"]].rename(columns={"dotSize": "w_to"}),
+        left_on="to",
+        right_on="labelToPlot"
+    ).drop(columns=["labelToPlot"])
+
+    # Filter by threshold
+    distances = distances[distances["dist"] < threshold]
+
+    labels_to_remove = []
+    while not distances.empty:
+        row = distances.iloc[0]
+        if row["w_from"] > row["w_to"]:
+            label = row["to"]
+        else:
+            label = row["from"]
+
+        labels_to_remove.append(label)
+
+        # Remove rows involving the selected label
+        distances = distances[(distances["from"] != label) & (distances["to"] != label)]
+
+    return set(labels_to_remove)
diff --git a/functions/get_filters.py b/functions/get_filters.py
index 206c215aa..d97732b71 100644
--- a/functions/get_filters.py
+++ b/functions/get_filters.py
@@ -12,7 +12,7 @@ def get_filters(df):
     Returns:
         A DataFrame with additional columns for filters and metrics.
     """
-    data = df.get()
+    data = df
 
     # Calculate the minimum and maximum publication years
     data["Min_Year"] = data["PY"].min()
@@ -35,10 +35,11 @@ def get_filters(df):
     cum_freq = SO_counts.cumsum()  # Cumulative frequency of occurrences
 
     # Define cutpoints for Bradford Law Zones
-    cutpoints = np.array([1, n * 0.33, n * 0.67, n + 1]).astype(int)
+    cutpoints = np.unique(np.array([1, n * 0.33, n * 0.67, n + 1]).astype(int))
 
     # Assign zones based on cumulative frequency
-    groups = pd.cut(cum_freq, bins=cutpoints, labels=["Zone 1", "Zone 2", "Zone 3"], right=False)
+    zone_labels = ["Zone 1", "Zone 2", "Zone 3"][:len(cutpoints)-1]
+    groups = pd.cut(cum_freq, bins=cutpoints, labels=zone_labels, right=False, duplicates="drop")
 
     # Create a DataFrame for zones
     zone_df = pd.DataFrame({
diff --git a/functions/get_frequentwords.py b/functions/get_frequentwords.py
index 8d790ffe1..9df016fb8 100644
--- a/functions/get_frequentwords.py
+++ b/functions/get_frequentwords.py
@@ -100,7 +100,7 @@ def table_tag(df, tag, ngrams=1, remove_terms=None, synonyms=None):
     """
     Extract and count words from a specified field in the DataFrame.
     """
-    M = df.get()
+    M = df
     
     # Remove duplicates
     M = M.drop_duplicates(subset='SR')
@@ -109,7 +109,7 @@ def table_tag(df, tag, ngrams=1, remove_terms=None, synonyms=None):
     if tag in ['AB', 'TI']:
         text_data = term_extraction(df, field=tag, stemming=False, verbose=False, 
                                   ngrams=ngrams, remove_terms=remove_terms, synonyms=synonyms)
-        text_data = text_data.get()
+        text_data = text_data
         text_data = text_data[f"{tag}_TM"]
     else:
         text_data = M[tag]
diff --git a/functions/get_historiograph.py b/functions/get_historiograph.py
index 089d02387..5357094d8 100644
--- a/functions/get_historiograph.py
+++ b/functions/get_historiograph.py
@@ -27,7 +27,10 @@ def get_historiograph(df, node_label="AU1", histNodes=20, hist_isolates=True, hi
         filename: nome del file HTML interattivo salvato temporaneamente
     """
     # Pre-elaborazione
-    df = metaTagExtraction(df, "SR")
+    if "SR" not in df.columns or (df["SR"] == "").all():
+        df = metaTagExtraction(df, "SR")
+    df["TC"] = pd.to_numeric(df["TC"], errors="coerce").fillna(0).astype(int)
+    df["PY"] = pd.to_numeric(df["PY"], errors="coerce").fillna(0).astype(int)
     hist_results = histNetwork(df, min_citations=0, sep=sep, network=True)
 
     # 1. Costruzione iniziale del grafo
@@ -41,6 +44,8 @@ def get_historiograph(df, node_label="AU1", histNodes=20, hist_isolates=True, hi
     )
 
     # 2. Recupera layout e rete iniziale
+    if hist_plot is None:
+        return None, None, None
     layout_df = pd.DataFrame(hist_plot["layout"]).copy()
     full_net = hist_plot["net"]
 
@@ -90,7 +95,8 @@ def get_historiograph(df, node_label="AU1", histNodes=20, hist_isolates=True, hi
     # Rimozione Year mancanti
     hist_data = hist_data[hist_data["Year"].notna()].copy()
     if hist_data.empty:
-        raise ValueError("Nessun dato con 'Year' valido per la historiograph.")
+        import plotly.graph_objects as go
+        return go.FigureWidget(), pd.DataFrame(), ""
 
     # Posizionamento temporale orizzontale
     hist_data = hist_data.sort_values(['cluster', 'Year'])
diff --git a/functions/get_historiograph.py.bak b/functions/get_historiograph.py.bak
new file mode 100644
index 000000000..089d02387
--- /dev/null
+++ b/functions/get_historiograph.py.bak
@@ -0,0 +1,213 @@
+from www.services import *
+from pyvis.network import Network
+import tempfile
+import pandas as pd
+import networkx as nx
+import os
+from matplotlib.colors import to_rgba
+
+def hex_to_rgba(hex_color, alpha):
+    if not isinstance(hex_color, str) or not hex_color.startswith("#") or len(hex_color) != 7:
+        hex_color = "#999999"  # fallback grigio neutro
+    try:
+        r, g, b = tuple(int(hex_color.lstrip("#")[i:i+2], 16) for i in (0, 2, 4))
+    except Exception:
+        r, g, b = (153, 153, 153)  # fallback rgb(153,153,153)
+    return f"rgba({r},{g},{b},{alpha})"
+
+
+
+def get_historiograph(df, node_label="AU1", histNodes=20, hist_isolates=True, histlabelsize=3, histsize=4, sep=";"):
+    """
+    Genera la historiograph e ritorna anche un file HTML interattivo con Pyvis.
+
+    Returns:
+        hist_plot: oggetto con layout e grafo networkx
+        hist_data: dataframe con metadati, DOI cliccabili, cluster, anni
+        filename: nome del file HTML interattivo salvato temporaneamente
+    """
+    # Pre-elaborazione
+    df = metaTagExtraction(df, "SR")
+    hist_results = histNetwork(df, min_citations=0, sep=sep, network=True)
+
+    # 1. Costruzione iniziale del grafo
+    hist_plot = histPlot(
+        hist_results,
+        n=histNodes,
+        size=histsize,
+        remove_isolates=False,  # rimozione manuale
+        label=node_label,
+        verbose=False
+    )
+
+    # 2. Recupera layout e rete iniziale
+    layout_df = pd.DataFrame(hist_plot["layout"]).copy()
+    full_net = hist_plot["net"]
+
+    # 3. Filtra archi per mantenere solo quelli con nodi nel top-N
+    selected_nodes = set(full_net.nodes())
+    edges_filtered = [(u, v) for u, v in full_net.edges() if u in selected_nodes and v in selected_nodes]
+
+    # 4. Ricostruisci rete filtrata
+    net_nx = nx.DiGraph()
+    net_nx.add_nodes_from(selected_nodes)
+    net_nx.add_edges_from(edges_filtered)
+
+    # 5. Opzionale: rimuovi componenti isolate
+    if hist_isolates:
+        connected_components = list(nx.connected_components(net_nx.to_undirected()))
+        valid_components = [c for c in connected_components if len(c) > 1]
+        valid_nodes = set().union(*valid_components)
+        net_nx = net_nx.subgraph(valid_nodes).copy()
+    else:
+        valid_nodes = set(net_nx.nodes)
+
+    # 6. Filtra layout
+    layout_df = layout_df[layout_df.index.isin(valid_nodes)].copy()
+    layout_df["name"] = layout_df.index
+    layout_df.reset_index(drop=True, inplace=True)
+
+    # 7. Filtra hist_data in base ai nodi presenti nel grafo
+    hist_data = hist_results["histData"].copy()
+    hist_data = hist_data[hist_data["Paper"].isin(valid_nodes)].copy()
+    hist_data = hist_data.merge(layout_df, left_on="Paper", right_on="name", how="left")
+
+
+    # Cluster da colore
+    if "color" in hist_data.columns:
+        unique_colors = hist_data['color'].dropna().unique()
+        color_to_cluster = {color: idx + 1 for idx, color in enumerate(unique_colors)}
+        hist_data['cluster'] = hist_data['color'].map(color_to_cluster)
+    else:
+        hist_data['color'] = "gray"
+        hist_data['cluster'] = -1
+
+    # Formattazione DOI cliccabile
+    hist_data['DOI'] = hist_data['DOI'].apply(
+        lambda doi: f'<a href="https://doi.org/{doi}" target="_blank">{doi}</a>' if pd.notnull(doi) else ""
+    )
+
+    # Rimozione Year mancanti
+    hist_data = hist_data[hist_data["Year"].notna()].copy()
+    if hist_data.empty:
+        raise ValueError("Nessun dato con 'Year' valido per la historiograph.")
+
+    # Posizionamento temporale orizzontale
+    hist_data = hist_data.sort_values(['cluster', 'Year'])
+    min_year = hist_data["Year"].min()
+    year_range = hist_data["Year"].max() - min_year + 1
+    # Spazio orizzontale compatto
+    hist_data["x"] = (hist_data["Year"] - min_year) * 60  # invece di /year_range * 1000
+
+    # Spazio verticale più ravvicinato tra cluster
+    hist_data["y"] = hist_data["cluster"] * 150 + np.random.uniform(-30, 30, size=len(hist_data))
+
+
+    # Tooltip e label robusti
+    hist_data["tooltip"] = hist_data.apply(
+        lambda row: (
+            f"<b>{str(row.get('Title', 'No Title')).replace('<', '&lt;').replace('>', '&gt;')}</b>"
+            f"<br><b>Year:</b> {row.get('Year', 'n.d.')}"
+            f"<br><b>DOI:</b> {row.get('DOI', '')}"
+            f"<br><b>LCS:</b> {int(row.get('LCS', 0))}"
+            f"<br><b>GCS:</b> {int(row.get('GCS', 0))}"
+        ),
+        axis=1
+    )
+    hist_data["label"] = hist_data.apply(
+        lambda row: str(row.get("Title", "No Title"))[:40] + "..." if len(str(row.get("Title", ""))) > 40 else str(row.get("Title", "No Title")),
+        axis=1
+    )
+
+    # Calcola opacità dinamica e dimensione font
+    min_font_size = 10
+    max_font_size = 130
+    base_font_size = 24  # oppure calcolato in base a metrica
+    font_opacity = np.sqrt((histlabelsize - min_font_size) / (max_font_size - min_font_size)) * 0.8 + 0.3
+    font_opacity = max(0.1, min(1, font_opacity))  # clamp tra 0.1 e 1
+
+
+    # Calcola dimensione proporzionale a LCS
+    if "LCS" in hist_data.columns and not hist_data["LCS"].isnull().all():
+        lcs_min = hist_data["LCS"].min()
+        lcs_max = hist_data["LCS"].max()
+        lcs_range = lcs_max - lcs_min if lcs_max > lcs_min else 1
+        hist_data["node_size"] = hist_data["LCS"].apply(lambda lcs: 10 + ((lcs - lcs_min) / lcs_range) * 10)
+    else:
+        hist_data["node_size"] = histsize
+
+    # Inizializza grafo Pyvis
+    net = Network(height="98vh", width="100%", directed=True, notebook=True, cdn_resources="in_line")
+    net.toggle_physics(False)
+
+    # Aggiungi nodi
+    for _, row in hist_data.iterrows():
+        base_color = row.get("color", "#999999")
+        color_rgba = hex_to_rgba(base_color, 0.8)
+        border_color = hex_to_rgba(base_color, 0.4)
+
+        if node_label == "AU1":
+            label_value = row.get("id", f"{row.get('name', 'unknown')}, {row.get('Year', 'n.d.')}")
+        elif node_label == "TI":
+            label_value = row.get("Title", "No Title")
+        elif node_label == "ID":
+            try:
+                keywords = eval(row.get("Author_Keywords", "[]")) if isinstance(row.get("Author_Keywords"), str) else row.get("Author_Keywords", [])
+                label_value = "; ".join(keywords) if keywords else "No keywords"
+            except:
+                label_value = "No keywords"
+        elif node_label == "DE":
+            try:
+                keywords = eval(row.get("KeywordsPlus", "[]")) if isinstance(row.get("KeywordsPlus"), str) else row.get("KeywordsPlus", [])
+                label_value = "; ".join(keywords) if keywords else "No keywords"
+            except:
+                label_value = "No keywords"
+        else:
+            label_value = "unknown"
+
+        net.add_node(
+            n_id=row["Paper"],
+            label=label_value,
+            title=row["tooltip"],
+            color={
+                "background": color_rgba,
+                "border": border_color,
+                "highlight": {
+                    "background": color_rgba,
+                    "border": "#000000"
+                }
+            },
+            x=row["x"],
+            y=row["y"],
+            size=row["node_size"],
+            font={
+                "size": histlabelsize,
+                "face": "arial",
+                "color": f"rgba(0,0,0,{font_opacity})"
+            },
+            borderWidth=2,
+            borderWidthSelected=3,
+            physics=False,
+            fixed={"x": True, "y": False}  # blocca solo l'asse x
+        )
+
+    # Aggiungi archi con ombreggiatura
+    existing_nodes = set(net.get_nodes())
+    for source, target in net_nx.edges():
+        if source in existing_nodes and target in existing_nodes:
+            source_color = hist_data.loc[hist_data["Paper"] == source, "color"].values[0]
+            edge_color = hex_to_rgba(source_color, 0.4)
+            net.add_edge(source, target, color=edge_color, width=1.5)
+
+    # Salva HTML temporaneo
+    tmp = tempfile.NamedTemporaryFile(delete=False, suffix=".html")
+    html_path = tmp.name
+    with open(html_path, 'w', encoding="utf-8") as f:
+        html = net.generate_html()
+        new_css = "     .card {\n                 border: none;\n             }"
+        updated_html = html.replace("</style>", new_css + "\n        </style>")
+        updated_html = updated_html.replace("1px solid lightgray", "none")
+        
+        f.write(updated_html)
+
+    return hist_plot, hist_data, html_path.split(os.sep)[-1]
diff --git a/functions/get_localcitedauthors.py b/functions/get_localcitedauthors.py
index e663192bc..22dcfef0b 100644
--- a/functions/get_localcitedauthors.py
+++ b/functions/get_localcitedauthors.py
@@ -20,7 +20,7 @@ def get_local_cited_authors(df, num_of_cited_authors, fast_search=False):
         loccit = 1
 
     df = metaTagExtraction(df, "SR")
-    M = df.get()
+    M = df
     
     # Fill missing values
     M['TC'] = M['TC'].fillna(0)
@@ -38,6 +38,7 @@ def get_local_cited_authors(df, num_of_cited_authors, fast_search=False):
     df_authors = pd.DataFrame({'AU': AU, 'LCS': M['LCS'].repeat(n).values})
     author_counts = df_authors.groupby('AU')['LCS'].sum().reset_index()
     author_counts.columns = ["Authors", "N. of Local Citations"]
+    author_counts["N. of Local Citations"] = author_counts["N. of Local Citations"].fillna(0).astype(int)
     author_counts = author_counts.sort_values(by="N. of Local Citations", ascending=False)
     
     # Limit the number of authors to display
@@ -74,7 +75,7 @@ def get_local_cited_authors(df, num_of_cited_authors, fast_search=False):
             y=list(range(len(author_counts))),
             mode="markers+text",
             marker=dict(
-                size=18 + 6 * (author_counts[frequency] / author_counts[frequency].max()),
+                size=18 + 6 * (author_counts[frequency] / author_counts[frequency].max()).fillna(0),
                 color=author_counts[frequency],
                 colorscale=[[0, "#B3D1F2"], [1, "#5567BB"]],
                 line=dict(width=1, color="#E0E0E0"),
diff --git a/functions/get_localcitedauthors.py.bak b/functions/get_localcitedauthors.py.bak
new file mode 100644
index 000000000..a88839335
--- /dev/null
+++ b/functions/get_localcitedauthors.py.bak
@@ -0,0 +1,148 @@
+from www.services import *
+
+
+def get_local_cited_authors(df, num_of_cited_authors, fast_search=False):
+    """
+    Generate a plot and table of the most local cited authors.
+    
+    Args:
+        df: A DataFrame object containing the data.
+        num_of_cited_authors: The number of top cited authors to display.
+        fast_search: Boolean indicating whether to use fast search or not.
+        
+    Returns:
+        A Plotly figure object and a DataFrame of the most local cited authors.
+    """    
+    # Determine the local citation threshold
+    if fast_search:
+        loccit = df['TC'].quantile(0.75)
+    else:
+        loccit = 1
+
+    df = metaTagExtraction(df, "SR")
+    M = df
+    
+    # Fill missing values
+    M['TC'] = M['TC'].fillna(0)
+
+    # Create a histogram network
+    H = histNetwork(df, min_citations=loccit, sep=";", network=False)
+    LCS = H['histData']
+    M = H['M']
+    
+    # Split authors and repeat local citations
+    AU = M['AU'].explode()
+    n = AU.groupby(level=0).size()
+    
+    # Create DataFrame for authors and local citations
+    df_authors = pd.DataFrame({'AU': AU, 'LCS': M['LCS'].repeat(n).values})
+    author_counts = df_authors.groupby('AU')['LCS'].sum().reset_index()
+    author_counts.columns = ["Authors", "N. of Local Citations"]
+    author_counts = author_counts.sort_values(by="N. of Local Citations", ascending=False)
+    
+    # Limit the number of authors to display
+    if num_of_cited_authors > len(author_counts):
+        num_of_cited_authors = len(author_counts)
+    
+    # Truncate author names to 50 characters
+    # author_counts["Authors"] = author_counts["Authors"].str[:50]
+
+    # Prepare the complete table and filter rows for display
+    table_located_authors = author_counts.copy()
+    author_counts = author_counts.head(num_of_cited_authors).reset_index(drop=True)
+
+    # Enhanced, beautiful, and readable plot for local cited authors
+    frequency = "N. of Local Citations"
+    # Create the plot (use scatter instead of scatter with orientation='h')
+    fig = go.Figure()
+
+    # Add a thick line from each label to its marker
+    for i, row in author_counts.iterrows():
+        fig.add_shape(
+            type="line",
+            x0=0,
+            x1=row[frequency],
+            y0=i,
+            y1=i,
+            line=dict(color="#e0e0e0", width=5),
+            layer="below",
+        )
+
+    fig.add_trace(
+        go.Scatter(
+            x=author_counts[frequency],
+            y=list(range(len(author_counts))),
+            mode="markers+text",
+            marker=dict(
+                size=18 + 6 * (author_counts[frequency] / author_counts[frequency].max()),
+                color=author_counts[frequency],
+                colorscale=[[0, "#B3D1F2"], [1, "#5567BB"]],
+                line=dict(width=1, color="#E0E0E0"),
+                opacity=0.95,
+                showscale=False,
+            ),
+            text=author_counts[frequency],
+            textposition="top center",  
+            textfont=dict(color="#5567BB", size=13),  
+            hovertemplate=(
+                "<b>Author:</b> %{customdata}<br>"
+                "<b>" + frequency + ":</b> %{x}<extra></extra>"
+            ),
+            customdata=author_counts["Authors"],
+        )
+    )
+
+    # Add horizontal grid lines for each author (lighter)
+    for i in range(len(author_counts)):
+        fig.add_shape(
+            type="line",
+            x0=0,
+            x1=author_counts[frequency].max(),
+            y0=i,
+            y1=i,
+            line=dict(color="#E0E0E0", width=2),
+            layer="below",
+        )
+
+    # Set x-axis ticks to 0, 5, 10, etc.
+    max_x = author_counts[frequency].max()
+    tick_step = 5
+    x_ticks = list(range(0, int(max_x) + tick_step, tick_step))
+    if x_ticks[-1] < max_x:
+        x_ticks.append(int(max_x))
+
+    fig.update_yaxes(
+        tickvals=list(range(len(author_counts))),
+        ticktext=author_counts["Authors"],
+        autorange="reversed",
+        showgrid=False,
+        title="Authors",
+        tickfont=dict(size=13),
+    )
+    fig.update_xaxes(
+        showgrid=True,
+        gridcolor="#F0F0F0",
+        zeroline=False,
+        tickvals=x_ticks,
+        title=frequency,
+        tickfont=dict(size=13),
+    )
+    fig.update_layout(
+        plot_bgcolor='white',
+        font=dict(color="#222222", size=14, family="Segoe UI, Arial"),
+        margin=dict(l=0, r=0, t=0, b=0),
+        height=50 + 90 * len(author_counts),
+        showlegend=False,
+        hoverlabel=dict(
+            bgcolor="white",
+            font_size=13,
+            font_family="Segoe UI, Arial",
+            bordercolor="#5567BB"
+        ),
+        coloraxis_showscale=False,
+    )
+    fig = go.FigureWidget(fig)
+    fig._config = fig._config | {'modeBarButtonsToRemove': ['pan', 'select', 'lasso2d', 'toImage'],
+                                 'displaylogo': False}
+    
+    return fig, table_located_authors
diff --git a/functions/get_localciteddocuments.py b/functions/get_localciteddocuments.py
index 1dea8d5a5..68e913d2c 100644
--- a/functions/get_localciteddocuments.py
+++ b/functions/get_localciteddocuments.py
@@ -14,7 +14,7 @@ def get_local_cited_documents(df, num_of_local_cited_docs, field_separator, fast
         A Plotly figure object and a DataFrame of the most local cited documents.
     """
     df = metaTagExtraction(df, "SR")
-    M = df.get()
+    M = df
 
     # Determine the local citation threshold
     if fast_search:
@@ -35,8 +35,8 @@ def get_local_cited_documents(df, num_of_local_cited_docs, field_separator, fast
         'Document': M['SR'],
         'DOI': M['DI'],
         'Year': M['PY'],
-        'Local Citations': M['LCS'],
-        'Global Citations': M['TC']
+        'Local Citations': M['LCS'].fillna(0).astype(int),
+        'Global Citations': M['TC'].fillna(0).astype(int)
     })
     
     # Calculate additional metrics
@@ -79,7 +79,7 @@ def get_local_cited_documents(df, num_of_local_cited_docs, field_separator, fast
             y=list(range(len(df_documents))),
             mode="markers+text",
             marker=dict(
-                size=18 + 6 * (df_documents["Local Citations"] / df_documents["Local Citations"].max()),
+                size=18 + 6 * (df_documents["Local Citations"] / df_documents["Local Citations"].max()).fillna(0),
                 color=df_documents["Local Citations"],
                 colorscale=[[0, "#B3D1F2"], [1, "#5567BB"]],
                 line=dict(width=1, color="#E0E0E0"),
diff --git a/functions/get_localciteddocuments.py.bak b/functions/get_localciteddocuments.py.bak
new file mode 100644
index 000000000..f4055504b
--- /dev/null
+++ b/functions/get_localciteddocuments.py.bak
@@ -0,0 +1,155 @@
+from www.services import *
+
+
+def get_local_cited_documents(df, num_of_local_cited_docs, field_separator, fast_search=False):
+    """
+    Generate a plot and table of the most local cited documents.
+    
+    Args:
+        df: A DataFrame object containing the data.
+        num_of_local_cited_docs: The number of top cited documents to display.
+        fast_search: Boolean indicating whether to use fast search or not.
+        
+    Returns:
+        A Plotly figure object and a DataFrame of the most local cited documents.
+    """
+    df = metaTagExtraction(df, "SR")
+    M = df
+
+    # Determine the local citation threshold
+    if fast_search:
+        loccit = M['TC'].quantile(0.75)
+    else:
+        loccit = 1
+    
+    # Fill missing values
+    M['TC'] = M['TC'].fillna(0)
+
+    # Create a histogram network
+    H = histNetwork(df, min_citations=loccit, sep=";", network=False)
+    LCS = H['histData']
+    M = H['M']
+    
+    # Create DataFrame for documents and local citations
+    df_documents = pd.DataFrame({
+        'Document': M['SR'],
+        'DOI': M['DI'],
+        'Year': M['PY'],
+        'Local Citations': M['LCS'],
+        'Global Citations': M['TC']
+    })
+    
+    # Calculate additional metrics
+    df_documents['LC/GC Ratio'] = (df_documents['Local Citations'] / df_documents['Global Citations'] * 100).round(2)
+    
+    # Calculate Normalized Local Citations within each publication year
+    df_documents['Normalized Local Citations'] = df_documents.groupby('Year')['Local Citations'].transform(lambda x: x / x.mean()).round(2)
+
+    # Calculate Normalized Global Citations within each publication year
+    df_documents['Normalized Global Citations'] = df_documents.groupby('Year')['Global Citations'].transform(lambda x: x / x.mean()).round(2)
+    
+    # Sort by local citations
+    df_documents = df_documents.sort_values(by='Local Citations', ascending=False)
+    
+    # Limit the number of documents to display
+    if num_of_local_cited_docs > len(df_documents):
+        num_of_local_cited_docs = len(df_documents)
+    
+    table_located_documents = df_documents.copy()
+    df_documents = df_documents.head(num_of_local_cited_docs)
+    
+    # Create the plot (horizontal scatter with lines, similar to author plot)
+    fig = go.Figure()
+
+    # Add a thick line from each document label to its marker
+    for idx, (i, row) in enumerate(df_documents.iterrows()):
+        fig.add_shape(
+            type="line",
+            x0=0,
+            x1=row["Local Citations"],
+            y0=idx,
+            y1=idx,
+            line=dict(color="#e0e0e0", width=5),
+            layer="below",
+        )
+
+    fig.add_trace(
+        go.Scatter(
+            x=df_documents["Local Citations"],
+            y=list(range(len(df_documents))),
+            mode="markers+text",
+            marker=dict(
+                size=18 + 6 * (df_documents["Local Citations"] / df_documents["Local Citations"].max()),
+                color=df_documents["Local Citations"],
+                colorscale=[[0, "#B3D1F2"], [1, "#5567BB"]],
+                line=dict(width=1, color="#E0E0E0"),
+                opacity=0.95,
+                showscale=False,
+            ),
+            text=df_documents["Local Citations"],
+            textposition="top center",
+            textfont=dict(color="#5567BB", size=13),
+            hovertemplate=(
+                "<b>Document:</b> %{customdata[0]}<br>"
+                "<b>Year:</b> %{customdata[1]}<br>"
+                "<b>Local Citations:</b> %{x}<br>"
+                "<b>Global Citations:</b> %{customdata[2]}<extra></extra>"
+            ),
+            customdata=df_documents[["Document", "Year", "Global Citations"]].values,
+        )
+    )
+
+    # Add horizontal grid lines for each document (lighter)
+    for idx in range(len(df_documents)):
+        fig.add_shape(
+            type="line",
+            x0=0,
+            x1=df_documents["Local Citations"].max(),
+            y0=idx,
+            y1=idx,
+            line=dict(color="#E0E0E0", width=2),
+            layer="below",
+        )
+
+    # Set x-axis ticks to 0, 5, 10, etc.
+    max_x = df_documents["Local Citations"].max()
+    tick_step = 5
+    x_ticks = list(range(0, int(max_x) + tick_step, tick_step))
+    if x_ticks[-1] < max_x:
+        x_ticks.append(int(max_x))
+
+    fig.update_yaxes(
+        tickvals=list(range(len(df_documents))),
+        ticktext=df_documents["Document"],
+        autorange="reversed",
+        showgrid=False,
+        title="Document",
+        tickfont=dict(size=13),
+    )
+    fig.update_xaxes(
+        showgrid=True,
+        gridcolor="#F0F0F0",
+        zeroline=False,
+        tickvals=x_ticks,
+        title="Local Citations",
+        tickfont=dict(size=13),
+    )
+    fig.update_layout(
+        plot_bgcolor='white',
+        font=dict(color="#222222", size=14, family="Segoe UI, Arial"),
+        margin=dict(l=250, r=40, t=40, b=40),
+        height=50 + 90 * len(df_documents),
+        showlegend=False,
+        hoverlabel=dict(
+            bgcolor="white",
+            font_size=13,
+            font_family="Segoe UI, Arial",
+            bordercolor="#5567BB"
+        ),
+        coloraxis_showscale=False,
+    )
+    fig = go.FigureWidget(fig)
+    fig._config = fig._config | {'modeBarButtonsToRemove': ['pan', 'select', 'lasso2d', 'toImage'],
+                                 'displaylogo': False}
+    
+    return fig, table_located_documents
diff --git a/functions/get_localcitedreferences.py b/functions/get_localcitedreferences.py
index 68ea11fef..9bc75cc85 100644
--- a/functions/get_localcitedreferences.py
+++ b/functions/get_localcitedreferences.py
@@ -13,7 +13,7 @@ def get_local_cited_refs(df, num_of_cited_refs, field_separator):
     Returns:
         A Plotly figure object and a DataFrame of the most local cited sources.
     """
-    data = df.get()
+    data = df
     
     if isinstance(data["CR"].iloc[0], list):  # Check if the first element is a list
         # Flatten the 'CR' column containing lists
diff --git a/functions/get_localcitedsources.py b/functions/get_localcitedsources.py
index 74b261455..03843bf72 100644
--- a/functions/get_localcitedsources.py
+++ b/functions/get_localcitedsources.py
@@ -16,7 +16,7 @@ def get_local_cited_sources(df, num_of_cited_sources):
     # Extract metadata tags for cited sources
     df = metaTagExtraction(df, "CR_SO")
 
-    data = df.get()
+    data = df
     
     if isinstance(data["CR_SO"].iloc[0], list):  # Check if the first element is a list
         # Flatten the 'CR_SO' column containing lists
@@ -100,6 +100,7 @@ def wrap_label(label, width=50):
     # Set x-axis ticks to 0, 50, 100, etc.
     max_x = source_counts["N. of Local Citations"].max()
     tick_step = 50
+    max_x = 0 if pd.isna(max_x) else max_x
     x_ticks = list(range(0, int(max_x) + tick_step, tick_step))
     if x_ticks[-1] < max_x:
         x_ticks.append(int(max_x))
diff --git a/functions/get_lotkalaw.py b/functions/get_lotkalaw.py
index 94545fda2..3357be77b 100644
--- a/functions/get_lotkalaw.py
+++ b/functions/get_lotkalaw.py
@@ -1,4 +1,5 @@
 from www.services import *
+import plotly.graph_objects as go
 
 
 def get_lotka_law(df):
@@ -14,7 +15,7 @@ def get_lotka_law(df):
     """
     
     # Calculate Lotka's Law
-    data = df.get()
+    data = df
     
     # Author Productivity (Lotka's Law)
     authors = pd.Series([author.strip() for sublist in data['AU'] for author in sublist])
@@ -24,6 +25,8 @@ def get_lotka_law(df):
     author_prod['Freq'] = author_prod['N.Authors'] / author_prod['N.Authors'].sum()
     
     # Calculate theoretical values
+    if len(author_prod) < 2:
+        return go.Figure(), author_prod
     lotka_law = np.polyfit(np.log10(author_prod['N.Articles']), np.log10(author_prod['Freq']), 1)
     author_prod['Theoretical'] = 10**(lotka_law[1] - 2 * np.log10(author_prod['N.Articles']))
     author_prod['Theoretical'] = author_prod['Theoretical'] / author_prod['Theoretical'].sum()
diff --git a/functions/get_lotkalaw.py.bak b/functions/get_lotkalaw.py.bak
new file mode 100644
index 000000000..af435110a
--- /dev/null
+++ b/functions/get_lotkalaw.py.bak
@@ -0,0 +1,100 @@
+from www.services import *
+
+
+def get_lotka_law(df):
+    """
+    Calculates Lotka's Law for a given dataset and generates a line plot comparing observed and theoretical author productivity distributions.
+
+    Args:
+        df (pd.DataFrame): Dataset containing at least the "AU" (authors) column as lists of author names.
+
+    Returns:
+        fig: Plotly figure showing the observed and theoretical Lotka's Law distributions.
+        author_prod (pd.DataFrame): Table summarizing the number of articles per author and their frequencies.
+    """
+    
+    # Calculate Lotka's Law
+    data = df
+    
+    # Author Productivity (Lotka's Law)
+    authors = pd.Series([author.strip() for sublist in data['AU'] for author in sublist])
+    author_prod = authors.value_counts().reset_index()
+    author_prod.columns = ['Author', 'N.Articles']
+    author_prod = author_prod.groupby('N.Articles').size().reset_index(name='N.Authors')
+    author_prod['Freq'] = author_prod['N.Authors'] / author_prod['N.Authors'].sum()
+    
+    # Calculate theoretical values
+    lotka_law = np.polyfit(np.log10(author_prod['N.Articles']), np.log10(author_prod['Freq']), 1)
+    author_prod['Theoretical'] = 10**(lotka_law[1] - 2 * np.log10(author_prod['N.Articles']))
+    author_prod['Theoretical'] = author_prod['Theoretical'] / author_prod['Theoretical'].sum()
+    
+    # Create the plot with improved hover
+    fig = go.Figure()
+
+    # Observed line
+    fig.add_trace(
+        go.Scatter(
+            x=author_prod['N.Articles'],
+            y=author_prod['Freq'],
+            mode='lines+markers',
+            name='Observed',
+            marker=dict(
+                size=10 + 8 * (author_prod['Freq'] / author_prod['Freq'].max()),
+                color=author_prod['Freq'],
+                colorscale=[[0, "#B3D1F2"], [1, "#5567BB"]],
+                line=dict(width=1, color="#E0E0E0"),
+                opacity=0.95,
+                showscale=False,
+            ),
+            line=dict(color="#5567BB", width=2),
+            hovertemplate=(
+                "<span style='color:white'><b>Documents written:</b> %{x}<br>"
+                "<b>% of Authors:</b> %{y:.2%}<br>"
+                "<b>N. Authors:</b> %{customdata}</span><extra></extra>"
+            ),
+            customdata=author_prod['N.Authors'],
+        )
+    )
+
+    # Theoretical line
+    fig.add_trace(
+        go.Scatter(
+            x=author_prod['N.Articles'],
+            y=author_prod['Theoretical'],
+            mode='lines+markers',
+            name='Theoretical',
+            marker=dict(
+                size=10,
+                color="#888888",
+                line=dict(width=1, color="#E0E0E0"),
+                opacity=0.7,
+            ),
+            line=dict(dash='dash', color='black', width=2),
+            hovertemplate=(
+                "<span style='color:white'><b>Documents written:</b> %{x}<br>"
+                "<b>Theoretical % of Authors:</b> %{y:.2%}</span><extra></extra>"
+            ),
+        )
+    )
+
+    # Customize the layout
+    fig.update_layout(
+        xaxis_title='Documents written',
+        yaxis_title='% of Authors',
+        plot_bgcolor='white',
+        title_font_size=24,
+        font=dict(color="#444444"),
+        margin=dict(l=40, r=40, t=40, b=40),
+        legend=dict(orientation='h', yanchor='bottom', y=1.02, xanchor='center', x=0.5),
+        height=600,
+    )
+
+    # Customize the grid
+    fig.update_xaxes(showgrid=True, gridwidth=1, gridcolor='#EFEFEF')
+    fig.update_yaxes(showgrid=True, gridwidth=1, gridcolor='#EFEFEF', tickformat=".0%")
+
+    fig = go.FigureWidget(fig)
+    fig._config = fig._config | {'modeBarButtonsToRemove': ['pan', 'select', 'lasso2d', 'toImage'],
+                                 'displaylogo': False}
+    
+    return fig, author_prod
diff --git a/functions/get_maininformations.py b/functions/get_maininformations.py
index 97443abdb..00f11e590 100644
--- a/functions/get_maininformations.py
+++ b/functions/get_maininformations.py
@@ -12,7 +12,7 @@ def get_main_informations(df, log=False):
     Returns:
         A DataFrame with additional columns for filters and metrics.
     """
-    data = df.get()
+    data = df
 
     #### Min and Max Year ####
     start_time = time.time()
@@ -99,7 +99,7 @@ def count_authors(entry):
     if "AU_CO" not in data.columns:
         # Extract the required metadata
         df = metaTagExtraction(df, "AU_CO")
-        data = df.get()
+        data = df
         
     # Calculate "Country_Count" with a vectorized function
     data["Country_Count"] = data["AU_CO"].apply(lambda x: len(set(x)))
diff --git a/functions/get_referencesspectroscopy.py b/functions/get_referencesspectroscopy.py
index a2c3e1522..59dae6228 100644
--- a/functions/get_referencesspectroscopy.py
+++ b/functions/get_referencesspectroscopy.py
@@ -16,7 +16,7 @@ def get_references_spectroscopy(df, start_year, end_year=2005, field_separator_s
         rpys_table (pd.DataFrame): Table with RPYS data (years, citations, deviation from median, top references).
         cr_table (pd.DataFrame): Table of cited references with local citation counts and Google Scholar links.
     """
-    df = df.get()
+    df = df
 
     # Pulizia e preparazione dei dati
     c_references = df['CR'].apply(lambda x: [i for i in x]).explode()
@@ -32,10 +32,11 @@ def get_references_spectroscopy(df, start_year, end_year=2005, field_separator_s
     # Ripetere gli anni per ogni riferimento citato
     references_len = references.str.len()
     references = references[references_len > 0]
-    cited_years = references.apply(lambda refs: [int(re.findall(r'\b\d{4},', ref)[0][:-1]) if re.findall(r'\b\d{4},', ref) else 0 for ref in refs]).explode().astype(int).reset_index(drop=True)
+    cited_years = references.apply(lambda refs: [int(re.findall(r"\b\d{4},", ref)[0][:-1]) if re.findall(r"\b\d{4},", ref) else 0 for ref in refs]).explode().astype(int).reset_index(drop=True)
     references = references.explode().reset_index(drop=True)
 
     # Creazione del DataFrame delle citazioni
+    if cited_years.eq(0).all(): return None, None, None
     ref_df = pd.DataFrame({'Reference': references, 'CitedYear': cited_years})
 
     # Filtraggio per intervallo temporale
@@ -50,7 +51,9 @@ def get_references_spectroscopy(df, start_year, end_year=2005, field_separator_s
 
     # Aggiunta degli anni mancanti
     year_seq = rpys_table['CitedYear']
-    missing_years = set(range(year_seq.min(), year_seq.max() + 1)) - set(year_seq)
+    year_seq = year_seq.dropna().astype(int)
+    if len(year_seq) == 0: return None, None, None
+    missing_years = set(range(int(year_seq.min()), int(year_seq.max()) + 1)) - set(year_seq)
     missing_years_df = pd.DataFrame({'CitedYear': list(missing_years), 'Citations': [0] * len(missing_years)})
     rpys_table = pd.concat([rpys_table, missing_years_df]).sort_values('CitedYear').reset_index(drop=True)
 
diff --git a/functions/get_relevantaffiliations.py b/functions/get_relevantaffiliations.py
index b86e36509..47bee1200 100644
--- a/functions/get_relevantaffiliations.py
+++ b/functions/get_relevantaffiliations.py
@@ -13,7 +13,7 @@ def get_relevant_affiliations(df, num_of_affiliations, disambiguation):
     Returns:
         A Plotly figure object and a DataFrame of the most relevant authors.
     """
-    data = df.get()
+    data = df
 
     if disambiguation == "yes":
         # Extract affiliations from the "AU_UN" field
diff --git a/functions/get_relevantauthors.py b/functions/get_relevantauthors.py
index cdf960151..a160ae647 100644
--- a/functions/get_relevantauthors.py
+++ b/functions/get_relevantauthors.py
@@ -13,7 +13,7 @@ def get_relevant_authors(df, num_of_authors, frequency="N. of Documents"):
     Returns:
         A Plotly figure object and a DataFrame of the most relevant authors.
     """
-    data = df.get()
+    data = df
 
     # Drop rows with missing values
     data = data.dropna(subset=["AU"])
@@ -104,6 +104,7 @@ def get_relevant_authors(df, num_of_authors, frequency="N. of Documents"):
 
     # Set x-axis ticks to 0, 5, 10, etc.
     max_x = author_counts[frequency].max()
+    max_x = 0 if pd.isna(max_x) else max_x
     tick_step = 5
     x_ticks = list(range(0, int(max_x) + tick_step, tick_step))
     if x_ticks[-1] < max_x:
diff --git a/functions/get_relevantsources.py b/functions/get_relevantsources.py
index dccd8d3e5..e54df2361 100644
--- a/functions/get_relevantsources.py
+++ b/functions/get_relevantsources.py
@@ -12,7 +12,7 @@ def get_relevant_sources(df, num_of_sources):
     Returns:
         A Plotly figure object and a DataFrame of the most relevant sources.
     """
-    data = df.get()
+    data = df
 
     # Drop rows with missing values
     data = data.dropna(subset=["SO"])
diff --git a/functions/get_sourceslocalimpact.py b/functions/get_sourceslocalimpact.py
index 731c97194..b973ed65d 100644
--- a/functions/get_sourceslocalimpact.py
+++ b/functions/get_sourceslocalimpact.py
@@ -13,7 +13,7 @@ def get_sources_local_impact(df, num_of_sources_local_impact, source_local_impac
     Returns:
         A Plotly figure object and a DataFrame of the most impactful sources.
     """
-    df = df.get()
+    df = df
     today = pd.Timestamp.now().year
 
     # Ensure 'TC' and 'PY' are numeric
diff --git a/functions/get_sourcesproduction.py b/functions/get_sourcesproduction.py
index 0795668d7..6d1805d4f 100644
--- a/functions/get_sourcesproduction.py
+++ b/functions/get_sourcesproduction.py
@@ -13,7 +13,7 @@ def get_sources_production(df, num_of_sources_production, occurences):
     Returns:
         A Plotly figure object representing the sources' production over time.
     """
-    data = df.get()
+    data = df
 
     # Calculate the number of publications per year for each source
     WSO = cocMatrix(df, Field="SO")
diff --git a/functions/get_table.py b/functions/get_table.py
index 75b9c91d8..a24d63da4 100644
--- a/functions/get_table.py
+++ b/functions/get_table.py
@@ -67,6 +67,12 @@ def create_plotly_table(sorted_columns, dpi=300):
 
 # Function to generate and display the completeness table for bibliographic metadata
 def get_table(database, df, dpi=300, filter=False, modal=True):
+    import pandas as pd
+    if not isinstance(df, pd.DataFrame):
+        try:
+            df = df.get()
+        except AttributeError:
+            df = df()
     """
     Display a table showing the completeness of bibliographic metadata.
 
@@ -79,7 +85,7 @@ def get_table(database, df, dpi=300, filter=False, modal=True):
         A DataTable object if data is available, otherwise a message indicating no data.
     """
     # Retrieve the data from the DataFrame
-    data = df.get()
+    data = df
 
     table_html = ""
     fig = None
@@ -205,7 +211,7 @@ def get_table(database, df, dpi=300, filter=False, modal=True):
         # Return a DataTable object with the data and the HTML/Plotly tables
         return ui.HTML(
             DT(
-                df.get(),
+                df,
                 maxBytes="10MB",
                 classes="display compact stripe",
                 style="text-transform: uppercase; font-size: small; table-layout: auto;",
diff --git a/functions/get_thematicevolution.py b/functions/get_thematicevolution.py
index 65bb0077b..2f1580cf5 100644
--- a/functions/get_thematicevolution.py
+++ b/functions/get_thematicevolution.py
@@ -70,8 +70,8 @@ def get_thematic_evolution(df, field="ID", years=None, n=250, weight_index="inc_
     # Prepara la tabella di evoluzione tematica
     thematic_table = results["Data"].copy()
     thematic_table = thematic_table.rename(columns={
-        "Cluster_Label.x": "From",
-        "Cluster_Label.y": "To",
+        "Cluster_Label_x": "From",
+        "Cluster_Label_y": "To",
         "Words": "Words",
         "Inc_Weighted": "Weighted Inclusion Index",
         "Inc_index": "Inclusion Index",
@@ -94,7 +94,7 @@ def thematic_evolution(M, field="ID", years=None, n=250, min_freq=2, size=0.5, n
 
     for interval_label, Mk in list_df.items():
         Y.append(f"{min(Mk['PY'])}-{max(Mk['PY'])}")
-        Mk = reactive.Value(Mk)
+
         resk_tuple = thematic_map(
             Mk,
             field=field, n=n, minfreq=min_freq, ngrams=ngrams,
@@ -156,34 +156,34 @@ def append_period(label, period):
         res2['clusters']['label'] = res2['clusters']['Cluster'].apply(lambda x: append_period(x, Y[k]))
 
         # Step 1: Add len and tot columns to clusters
-        cluster1 = res1['words'].groupby('Cluster_Label').apply(lambda x: x.assign(
-            len=len(x), tot=x['Occurrences'].sum()
-        )).reset_index(drop=True)
-        cluster2 = res2['words'].groupby('Cluster_Label').apply(lambda x: x.assign(
-            len=len(x), tot=x['Occurrences'].sum()
-        )).reset_index(drop=True)
+        cluster1 = res1['words'].copy()
+        cluster1['len'] = cluster1.groupby('Cluster_Label')['Occurrences'].transform('count')
+        cluster1['tot'] = cluster1.groupby('Cluster_Label')['Occurrences'].transform('sum')
+        cluster2 = res2['words'].copy()
+        cluster2['len'] = cluster2.groupby('Cluster_Label')['Occurrences'].transform('count')
+        cluster2['tot'] = cluster2.groupby('Cluster_Label')['Occurrences'].transform('sum')
 
         # Step 2: Inner join on Words
-        A = pd.merge(cluster1, cluster2, on="Words", suffixes=(".x", ".y"))
+        A = pd.merge(cluster1, cluster2, on="Words", suffixes=("_x", "_y"))
 
         # Step 3: For each pair of clusters, compute min, Occ, tot
-        A['min'] = A[['Occurrences.x', 'Occurrences.y']].min(axis=1)
-        A['Occ'] = A['Occurrences.x']
-        A['tot'] = A[['tot.x', 'tot.y']].min(axis=1)
+        A['min'] = A[['Occurrences_x', 'Occurrences_y']].min(axis=1)
+        A['Occ'] = A['Occurrences_x']
+        A['tot'] = A[['tot_x', 'tot_y']].min(axis=1)
 
         # Step 4: Group and summarize as in R
         B = (
-            A.groupby(['Cluster_Label.x', 'Cluster_Label.y'])
+            A.groupby(['Cluster_Label_x', 'Cluster_Label_y'])
             .apply(lambda row: pd.Series({
-            "CL1": row['Cluster.x'].iloc[0],
-            "CL2": row['Cluster.y'].iloc[0],
+            "CL1": row['Cluster_x'].iloc[0],
+            "CL2": row['Cluster_y'].iloc[0],
             "Words": ";".join(row['Words']),
             "sum": row['min'].sum(),
             "Inc_Weighted": row['min'].sum() / row['tot'].min() if row['tot'].min() > 0 else 0,
-            "Inc_index": len(row['Words']) / min(row['len.x'].iloc[0], row['len.y'].iloc[0]) if min(row['len.x'].iloc[0], row['len.y'].iloc[0]) > 0 else 0,
+            "Inc_index": len(row['Words']) / min(row['len_x'].iloc[0], row['len_y'].iloc[0]) if min(row['len_x'].iloc[0], row['len_y'].iloc[0]) > 0 else 0,
             "Occ": row['Occ'].iloc[0],
             "Tot": row['tot'].iloc[0],
-            "Stability": len(row['Words']) / (row['len.x'].iloc[0] + row['len.y'].iloc[0] - len(row['Words'])) if (row['len.x'].iloc[0] + row['len.y'].iloc[0] - len(row['Words'])) > 0 else 0
+            "Stability": len(row['Words']) / (row['len_x'].iloc[0] + row['len_y'].iloc[0] - len(row['Words'])) if (row['len_x'].iloc[0] + row['len_y'].iloc[0] - len(row['Words'])) > 0 else 0
             }))
             .reset_index()
         )
@@ -198,10 +198,10 @@ def append_period(label, period):
         INC = pd.concat(inc_matrix, ignore_index=True)
 
         # Edges dataframe
-        edges = INC[['Cluster_Label.x', 'Cluster_Label.y', 'Inc_index', 'Inc_Weighted', 'Stability']].copy()
+        edges = INC[['Cluster_Label_x', 'Cluster_Label_y', 'Inc_index', 'Inc_Weighted', 'Stability']].copy()
 
         # Nodes dataframe
-        unique_labels = pd.unique(edges[['Cluster_Label.x', 'Cluster_Label.y']].values.ravel())
+        unique_labels = pd.unique(edges[['Cluster_Label_x', 'Cluster_Label_y']].values.ravel())
         nodes = pd.DataFrame({'name': unique_labels})
         nodes['group'] = nodes['name']
 
@@ -211,8 +211,8 @@ def append_period(label, period):
 
         # Map cluster labels to node IDs for 'from' and 'to'
         label_to_id = dict(zip(nodes['name'], nodes['id']))
-        edges['from'] = edges['Cluster_Label.x'].map(label_to_id)
-        edges['to'] = edges['Cluster_Label.y'].map(label_to_id)
+        edges['from'] = edges['Cluster_Label_x'].map(label_to_id)
+        edges['to'] = edges['Cluster_Label_y'].map(label_to_id)
 
         # Rename columns as in R
         edges = edges.rename(columns={
@@ -310,7 +310,7 @@ def timeslice(M, breaks=None, k=5):
     Returns:
         dict: Dictionary containing DataFrames for each sub-period.
     """
-    M = M.get()
+    M = M
 
     # Convert the 'PY' column to numeric
     M['PY'] = pd.to_numeric(M['PY'], errors='coerce')
@@ -319,7 +319,9 @@ def timeslice(M, breaks=None, k=5):
     if breaks is None or (isinstance(breaks, list) and len(breaks) == 0):
         breaks = np.floor(np.linspace(M['PY'].min() - 1, M['PY'].max(), k + 1))
     else:
-        breaks = [M['PY'].min() - 1] + breaks + [M['PY'].max()]
+        py_min = M['PY'].min()
+        py_max = M['PY'].max()
+        breaks = sorted(set([py_min - 1] + [b for b in breaks if py_min <= b <= py_max] + [py_max + 1]))
 
     # print("breaks:", breaks)
     
diff --git a/functions/get_thematicmap.py b/functions/get_thematicmap.py
index 68d1f37d6..64bf52ace 100644
--- a/functions/get_thematicmap.py
+++ b/functions/get_thematicmap.py
@@ -25,10 +25,12 @@ def get_thematic_map(df, field="ID", n=250, minfreq=5, ngrams=1, stemming=False,
         A tuple containing the HTML file name and a DataFrame with the extracted terms.
     """
     
-    map, graph_path, words, clusters, documentToClusters = thematic_map(
+    result = thematic_map(
         df, field=field, n=n, minfreq=minfreq, ngrams=ngrams, stemming=stemming, size=size,
         n_labels=n_labels, community_repulsion=community_repulsion, repel=repel,
         remove_terms=remove_terms, synonyms=synonyms, cluster=cluster, subgraphs=subgraphs
     )
-    
+    if result is None:
+        return None, None, None, None, None
+    map, graph_path, words, clusters, documentToClusters = result
     return map, graph_path, words, clusters, documentToClusters
diff --git a/functions/get_treemap.py b/functions/get_treemap.py
index 1f3f765f0..2db1ca28b 100644
--- a/functions/get_treemap.py
+++ b/functions/get_treemap.py
@@ -75,7 +75,7 @@ def table_tag(df, tag, ngrams=1, remove_terms=None, synonyms=None):
     """
     Extract and count words from a specified field in the DataFrame.
     """
-    M = df.get()
+    M = df
     
     # Remove duplicates
     M = M.drop_duplicates(subset='SR')
diff --git a/functions/get_trendtopics.py b/functions/get_trendtopics.py
index 1d2f1df3a..7f2cecb96 100644
--- a/functions/get_trendtopics.py
+++ b/functions/get_trendtopics.py
@@ -2,117 +2,81 @@
 
 
 def get_trend_topics(df, ngram, field_tt, time_window, file_upload_terms_tt, file_upload_synonyms_tt, word_minimum_frequency, number_of_words_year):
-    """
-    Generate a plot of trend topics over time.
-
-    Args:
-        df: A DataFrame object containing the data.
-        ngram: The number of n-grams to consider.
-        field_tt: The field to analyze for trend topics.
-        time_window: The time window to consider.
-        file_upload_terms_tt: File containing terms to remove.
-        file_upload_synonyms_tt: File containing synonyms.
-        word_minimum_frequency: The minimum frequency of words to consider.
-        number_of_words_year: The number of words to display per year.
-
-    Returns:
-        A Plotly figure object representing the trend topics over time.
-    """
-    
-    # Load terms to remove
     remove_terms = None
     if file_upload_terms_tt:
         with open(file_upload_terms_tt[0]['datapath'], 'r', encoding='utf-8') as file:
             remove_terms = [line.strip() for line in file]
 
-    # Load synonyms
     synonyms = None
     if file_upload_synonyms_tt:
         with open(file_upload_synonyms_tt[0]['datapath'], 'r', encoding='utf-8') as file:
             synonyms = {}
             for line in file:
                 terms = [term.strip() for term in line.split(',')]
-                key = terms[0]
-                values = terms[1:]
-                synonyms[key] = values
+                synonyms[terms[0]] = terms[1:]
 
-    # Set ngrams based on word_type
     ngrams = int(ngram) if field_tt in ['TI', 'AB'] else 1
 
-    # Extract terms
     if field_tt in ["TI", "AB"]:
-        df = term_extraction(df, field=field_tt, stemming=False, verbose=False, 
-                            ngrams=ngrams, remove_terms=remove_terms, synonyms=synonyms)
+        df = term_extraction(df, field=field_tt, stemming=False, verbose=False,
+                             ngrams=ngrams, remove_terms=remove_terms, synonyms=synonyms)
         field = f"{field_tt}_TM"
     else:
         field = field_tt
 
-    # Get trend topics
     trend_topics = field_by_year(df, field, time_window, word_minimum_frequency, number_of_words_year, remove_terms, synonyms)
 
-    # Plot
-    fig = px.scatter(trend_topics, x='year_med', y='item', size='freq', hover_data=['year_q1', 'year_q3'], height=800)
+    if trend_topics.empty:
+        return go.FigureWidget(), trend_topics
+
+    fig = px.scatter(trend_topics, x='year_med', y='item', size='freq',
+                     hover_data=['year_q1', 'year_q3'], height=800)
     fig.update_layout(
-        xaxis_title='Year', 
-        yaxis_title='Term', 
-        showlegend=False, 
+        xaxis_title='Year', yaxis_title='Term', showlegend=False,
         plot_bgcolor='white',
         xaxis=dict(showgrid=False),
         yaxis=dict(showgrid=True, gridcolor='lightgrey'),
-        hoverlabel=dict(
-            bgcolor="white",
-            font_size=13,
-            font_family="Segoe UI, Arial",
-            bordercolor="#5567BB"
-        ),
     )
-    fig.update_traces(
-        hovertemplate=
-            "<b>Term:</b> %{y}<br>" +
-            "<b>Median Year:</b> %{x}<br>" +
-            "<b>Frequency:</b> %{marker.size}<br>" +
-            "<b>Q1 Year:</b> %{customdata[0]}<br>" +
-            "<b>Q3 Year:</b> %{customdata[1]}<br>" +
-            "<extra></extra>",
-        customdata=trend_topics[['year_q1', 'year_q3']].values
-    )
-
     for i in range(len(trend_topics)):
         fig.add_shape(
             type='line',
-            x0=trend_topics['year_q1'].iloc[i], 
-            y0=trend_topics['item'].iloc[i],
-            x1=trend_topics['year_q3'].iloc[i], 
-            y1=trend_topics['item'].iloc[i],
-            line=dict(color='lightblue', width=5),  # Adjust width proportionallyù
-            layer='below'
+            x0=trend_topics['year_q1'].iloc[i], y0=trend_topics['item'].iloc[i],
+            x1=trend_topics['year_q3'].iloc[i], y1=trend_topics['item'].iloc[i],
+            line=dict(color='lightblue', width=5), layer='below'
         )
-
-    fig.update_traces(marker=dict(color='dodgerblue', opacity=1), selector=dict(mode='markers'))  # Ensure no opacity and bring to front
+    fig.update_traces(marker=dict(color='dodgerblue', opacity=1), selector=dict(mode='markers'))
     fig = go.FigureWidget(fig)
-    fig._config = fig._config | {'modeBarButtonsToRemove': ['pan', 'select', 'lasso2d', 'toImage'],
-                                 'displaylogo': False}
-
+    fig._config = fig._config | {'modeBarButtonsToRemove': ['pan', 'select', 'lasso2d', 'toImage'], 'displaylogo': False}
     return fig, trend_topics
 
+
 def field_by_year(df, field, timespan, min_freq, n_items, remove_terms=None, synonyms=None):
-    # Create co-occurrence matrix
     A = cocMatrix(df, Field=field, binary=False, remove_terms=remove_terms, synonyms=synonyms)
-    n = A.sum(axis=0).to_numpy()  # Convert to 1D array
-    df = df.get()
-
-    # Calculate quantiles
-    trend_med = pd.DataFrame(A.values).apply(lambda x: pd.Series(np.round(np.quantile(np.repeat(df['PY'], x), [0.25, 0.5, 0.75]))), axis=0).T
-    trend_med.columns = ['year_q1', 'year_med', 'year_q3']
-    trend_med['freq'] = n
-    trend_med['item'] = A.columns
-
-    # Filter by timespan and frequency
-    if timespan is None or len(timespan) != 2:
+    py_values = df['PY'].to_numpy()
+
+    records = []
+    for col in A.columns:
+        counts = A[col].values
+        repeated = []
+        for py, cnt in zip(py_values, counts):
+            repeated.extend([py] * int(cnt))
+        repeated = np.array(repeated)
+        if len(repeated) == 0:
+            records.append([0.0, 0.0, 0.0])
+        else:
+            q = np.round(np.quantile(repeated, [0.25, 0.5, 0.75]))
+            records.append(q.tolist())
+
+    trend_med = pd.DataFrame(records, columns=['year_q1', 'year_med', 'year_q3'])
+    trend_med['freq'] = A.sum(axis=0).to_numpy()
+    trend_med['item'] = A.columns.tolist()
+
+    if timespan is None or not hasattr(timespan, "__len__") or len(timespan) != 2:
         timespan = [trend_med['year_med'].min(), trend_med['year_med'].max()]
 
     trend_med = trend_med[(trend_med['year_med'] >= timespan[0]) & (trend_med['year_med'] <= timespan[1])]
     trend_med = trend_med[trend_med['freq'] >= min_freq]
-    trend_med = trend_med.groupby('year_med').apply(lambda x: x.nlargest(n_items, 'freq')).reset_index(drop=True)
-
+    if trend_med.empty:
+        return trend_med
+    trend_med = trend_med.sort_values('freq', ascending=False).groupby('year_med', group_keys=False).head(n_items).reset_index(drop=True)
     return trend_med
diff --git a/functions/get_trendtopics.py.bak b/functions/get_trendtopics.py.bak
new file mode 100644
index 000000000..2739dc50d
--- /dev/null
+++ b/functions/get_trendtopics.py.bak
@@ -0,0 +1,82 @@
+from www.services import *
+
+
+def get_trend_topics(df, ngram, field_tt, time_window, file_upload_terms_tt, file_upload_synonyms_tt, word_minimum_frequency, number_of_words_year):
+    remove_terms = None
+    if file_upload_terms_tt:
+        with open(file_upload_terms_tt[0]['datapath'], 'r', encoding='utf-8') as file:
+            remove_terms = [line.strip() for line in file]
+
+    synonyms = None
+    if file_upload_synonyms_tt:
+        with open(file_upload_synonyms_tt[0]['datapath'], 'r', encoding='utf-8') as file:
+            synonyms = {}
+            for line in file:
+                terms = [term.strip() for term in line.split(',')]
+                synonyms[terms[0]] = terms[1:]
+
+    ngrams = int(ngram) if field_tt in ['TI', 'AB'] else 1
+
+    if field_tt in ["TI", "AB"]:
+        df = term_extraction(df, field=field_tt, stemming=False, verbose=False,
+                             ngrams=ngrams, remove_terms=remove_terms, synonyms=synonyms)
+        field = f"{field_tt}_TM"
+    else:
+        field = field_tt
+
+    trend_topics = field_by_year(df, field, time_window, word_minimum_frequency, number_of_words_year, remove_terms, synonyms)
+
+    if trend_topics.empty:
+        return go.FigureWidget(), trend_topics
+
+    fig = px.scatter(trend_topics, x='year_med', y='item', size='freq',
+                     hover_data=['year_q1', 'year_q3'], height=800)
+    fig.update_layout(
+        xaxis_title='Year', yaxis_title='Term', showlegend=False,
+        plot_bgcolor='white',
+        xaxis=dict(showgrid=False),
+        yaxis=dict(showgrid=True, gridcolor='lightgrey'),
+    )
+    for i in range(len(trend_topics)):
+        fig.add_shape(
+            type='line',
+            x0=trend_topics['year_q1'].iloc[i], y0=trend_topics['item'].iloc[i],
+            x1=trend_topics['year_q3'].iloc[i], y1=trend_topics['item'].iloc[i],
+            line=dict(color='lightblue', width=5), layer='below'
+        )
+    fig.update_traces(marker=dict(color='dodgerblue', opacity=1), selector=dict(mode='markers'))
+    fig = go.FigureWidget(fig)
+    fig._config = fig._config | {'modeBarButtonsToRemove': ['pan', 'select', 'lasso2d', 'toImage'], 'displaylogo': False}
+    return fig, trend_topics
+
+
+def field_by_year(df, field, timespan, min_freq, n_items, remove_terms=None, synonyms=None):
+    A = cocMatrix(df, Field=field, binary=False, remove_terms=remove_terms, synonyms=synonyms)
+    py_values = df['PY'].to_numpy()
+
+    records = []
+    for col in A.columns:
+        counts = A[col].values
+        repeated = []
+        for py, cnt in zip(py_values, counts):
+            repeated.extend([py] * int(cnt))
+        repeated = np.array(repeated)
+        if len(repeated) == 0:
+            records.append([0.0, 0.0, 0.0])
+        else:
+            q = np.round(np.quantile(repeated, [0.25, 0.5, 0.75]))
+            records.append(q.tolist())
+
+    trend_med = pd.DataFrame(records, columns=['year_q1', 'year_med', 'year_q3'])
+    trend_med['freq'] = A.sum(axis=0).to_numpy()
+    trend_med['item'] = A.columns.tolist()
+
+    if timespan is None or len(timespan) != 2:
+        timespan = [trend_med['year_med'].min(), trend_med['year_med'].max()]
+
+    trend_med = trend_med[(trend_med['year_med'] >= timespan[0]) & (trend_med['year_med'] <= timespan[1])]
+    trend_med = trend_med[trend_med['freq'] >= min_freq]
+    if trend_med.empty:
+        return trend_med
+    trend_med = trend_med.sort_values('freq', ascending=False).groupby('year_med', group_keys=False).head(n_items).reset_index(drop=True)
+    return trend_med
diff --git a/functions/get_wordcloud.py b/functions/get_wordcloud.py
index e902f3bd6..3d84a19af 100644
--- a/functions/get_wordcloud.py
+++ b/functions/get_wordcloud.py
@@ -106,7 +106,7 @@ def table_tag(df, tag, ngrams=1, remove_terms=None, synonyms=None):
     """
     Extract and count words from a specified field in the DataFrame.
     """
-    M = df.get()
+    M = df
     
     # Remove duplicates
     M = M.drop_duplicates(subset='SR')
diff --git a/functions/get_wordfrequency.py b/functions/get_wordfrequency.py
index 1f2b81a06..4592a516f 100644
--- a/functions/get_wordfrequency.py
+++ b/functions/get_wordfrequency.py
@@ -34,12 +34,15 @@ def get_word_frequency(df, ngram, field_wf, file_upload_terms_wf, file_upload_sy
                 values = terms[1:]
                 synonyms[key] = values
 
+    # Normalize top_words to list if scalar
+    if not hasattr(top_words, "__len__"):
+        top_words = [0, int(top_words)]
     # Set ngrams based on word_type
     ngrams = int(ngram) if field_wf in ['TI', 'AB'] else 1
 
     data = term_extraction(df, field=field_wf, stemming=False, verbose=False, 
                                 ngrams=ngrams, remove_terms=remove_terms, synonyms=synonyms)
-    data = data.get()
+    data = data
     if field_wf == 'TI':
         print(data[f"{field_wf}_TM"])
 
@@ -54,6 +57,7 @@ def get_word_frequency(df, ngram, field_wf, file_upload_terms_wf, file_upload_sy
     word_freq = word_freq[['Year'] + word_freq.columns[top_words[0]:top_words[1] + 1].tolist()]
     
     # Reshape the data for plotting
+    word_freq = word_freq.loc[:, ~word_freq.columns.duplicated()]
     word_freq_melted = word_freq.melt(id_vars=['Year'], var_name='Term', value_name='Frequency')
 
     # Create the plot
diff --git a/functions/get_wordfrequency.py.bak b/functions/get_wordfrequency.py.bak
new file mode 100644
index 000000000..7332dd31e
--- /dev/null
+++ b/functions/get_wordfrequency.py.bak
@@ -0,0 +1,163 @@
+from www.services import *
+
+
+def get_word_frequency(df, ngram, field_wf, file_upload_terms_wf, file_upload_synonyms_wf, occurrences, top_words):
+    """
+    Generate a plot of word frequency over time.
+
+    Args:
+        df: A DataFrame object containing the data.
+        ngram: The number of n-grams to consider.
+        field_wf: The field to analyze for word frequency.
+        file_upload_terms_wf: File containing terms to remove.
+        file_upload_synonyms_wf: File containing synonyms.
+        occurrences: Type of occurrences ('cumulate' or 'per_year').
+        top_words: The number of top words to display.
+
+    Returns:
+        A Plotly figure object representing the word frequency over time.
+    """
+    # Load terms to remove
+    remove_terms = None
+    if file_upload_terms_wf:
+        with open(file_upload_terms_wf[0]['datapath'], 'r', encoding='utf-8') as file:
+            remove_terms = [line.strip() for line in file]
+
+    # Load synonyms
+    synonyms = None
+    if file_upload_synonyms_wf:
+        with open(file_upload_synonyms_wf[0]['datapath'], 'r', encoding='utf-8') as file:
+            synonyms = {}
+            for line in file:
+                terms = [term.strip() for term in line.split(',')]
+                key = terms[0]
+                values = terms[1:]
+                synonyms[key] = values
+
+    # Set ngrams based on word_type
+    ngrams = int(ngram) if field_wf in ['TI', 'AB'] else 1
+
+    data = term_extraction(df, field=field_wf, stemming=False, verbose=False, 
+                                ngrams=ngrams, remove_terms=remove_terms, synonyms=synonyms)
+    data = data
+    if field_wf == 'TI':
+        print(data[f"{field_wf}_TM"])
+
+    # Calculate word frequency
+    if field_wf in ['AB', 'TI']:
+        word_freq = keyword_growth(data, tag=f"{field_wf}_TM", top=top_words[1], cdf=(occurrences == 'cumulate'), remove_terms=remove_terms, synonyms=synonyms)
+    else:
+        word_freq = keyword_growth(data, tag=field_wf, top=top_words[1], cdf=(occurrences == 'cumulate'), remove_terms=remove_terms, synonyms=synonyms)
+
+
+    # Select terms between top_words[1] and top_words[2]
+    word_freq = word_freq[['Year'] + word_freq.columns[top_words[0]:top_words[1] + 1].tolist()]
+    
+    # Reshape the data for plotting
+    word_freq_melted = word_freq.melt(id_vars=['Year'], var_name='Term', value_name='Frequency')
+
+    # Create the plot
+    fig = px.line(
+        word_freq_melted,
+        x='Year',
+        y='Frequency',
+        color='Term',
+        labels={'Year': 'Year', 'Frequency': 'Frequency', 'Term': 'Term'},
+    )
+
+    # Customize the layout
+    fig.update_layout(
+        xaxis=dict(
+            tickmode='array',
+            tickvals=word_freq['Year'].unique()[::max(1, len(word_freq['Year'].unique()) // 20)]
+        ),
+        yaxis_title="Frequency",
+        xaxis_title="Year",
+        plot_bgcolor='white',
+        title_font_size=24,
+        font=dict(color="#444444"),
+        margin=dict(l=40, r=40, t=40, b=40),
+        height=800,
+        legend=dict(
+            title="Term",
+            orientation="h",
+            yanchor="top",
+            y=-0.2,
+            xanchor="center",
+            x=0.5,
+            font=dict(size=10)
+        )
+    )
+
+    # Customize the grid
+    fig.update_xaxes(showgrid=True, gridwidth=1, gridcolor='#EFEFEF')
+    fig.update_yaxes(showgrid=True, gridwidth=1, gridcolor='#EFEFEF')
+    fig = go.FigureWidget(fig)
+    fig._config = fig._config | {'modeBarButtonsToRemove': ['pan', 'select', 'lasso2d', 'toImage'],
+                                 'displaylogo': False}
+
+    return fig, word_freq
+
+# Funzioni ausiliarie
+def trim_years(w, year_range, cdf=True):
+    """Funzione per calcolare frequenze cumulative o annuali."""
+    W = np.zeros(len(year_range))
+    Y = np.array(list(w.index))
+    w_values = np.array(w)
+
+    for i in range(len(year_range)):
+        if len(Y) > 0 and Y[0] == year_range[i]:
+            W[i] = w_values[0]
+            Y = Y[1:]
+            w_values = w_values[1:]
+
+    if cdf:
+        W = np.cumsum(W)
+
+    W = pd.Series(W, index=year_range)
+
+    return W
+
+
+def keyword_growth(df, tag, sep=";", top=10, cdf=True, remove_terms=None, synonyms=None):
+    """
+    Simula la funzione KeywordGrowth in R.
+    df: dataframe con i dati.
+    tag: colonna da analizzare.
+    sep: separatore per il parsing.
+    top: numero massimo di termini da considerare.
+    cdf: se True, calcola occorrenze cumulative.
+    remove_terms: lista di termini da rimuovere.
+    synonyms: dizionario {termine_sostituto: [lista_di_sinonimi]}.
+    """
+    # Parsing e filtraggio
+    df = df.dropna(subset=[tag])
+    expanded = [item.upper() for sublist in df[tag].apply(lambda x: x.split(sep) if isinstance(x, str) else x) for item in sublist]
+    years = df.loc[df.index.repeat(df[tag].apply(lambda x: len(x.split(sep)) if isinstance(x, str) else len(x))), 'PY'].values
+    data = pd.DataFrame({'Term': expanded, 'Year': years})
+    
+    # Rimuovi terms
+    if remove_terms:
+        data = data[~data['Term'].str.upper().isin([term.upper() for term in remove_terms])]
+    
+    # Gestione dei sinonimi
+    if synonyms:
+        for main_term, syns in synonyms.items():
+            data['Term'] = data['Term'].replace(syns, main_term.upper())
+    
+    # Aggregazione
+    freq = data.groupby(['Term', 'Year']).size().reset_index(name='Freq')
+    year_range = range(data['Year'].min(), data['Year'].max() + 1)
+    
+    # Selezione dei termini più frequenti
+    top_terms = freq.groupby('Term')['Freq'].sum().nlargest(top).index
+    freq = freq[freq['Term'].isin(top_terms)]
+
+    # Costruzione del dataframe finale
+    results = pd.DataFrame({'Year': year_range})
+    for term in top_terms:
+        term_freq = freq[freq['Term'] == term].set_index('Year')['Freq']
+        term_freq = term_freq.reindex(year_range, fill_value=0)
+        results[term] = trim_years(term_freq, year_range, cdf=cdf).values
+
+    return results
diff --git a/functions/get_worldmapcollaboration.py b/functions/get_worldmapcollaboration.py
index 9edafa879..9edfb5528 100644
--- a/functions/get_worldmapcollaboration.py
+++ b/functions/get_worldmapcollaboration.py
@@ -10,7 +10,7 @@ def get_world_map_collaboration(df, edges_min=1, edgesize=5):
     # Estrai metadati dai paesi (assumi che tu abbia già AU_CO processato)
     M = df
     df = metaTagExtraction(df, "AU_CO")
-    df = df.get()
+    df = df
 
     # Normalizza e conta le occorrenze dei paesi (come in get_countries_production)
     df["AU_CO"] = df["AU_CO"].apply(lambda x: x if isinstance(x, list) else [x])
@@ -32,6 +32,8 @@ def clean_country_names(country):
 
     # Costruisci matrice di collaborazione
     net = biblionetwork(M, analysis="collaboration", network="countries")
+    if net is None or net.empty:
+        return None, pd.DataFrame()
     net_df = pd.DataFrame(net)
 
     # Costruisci rete
diff --git a/generate_perfect_mock.py b/generate_perfect_mock.py
new file mode 100644
index 000000000..3a865cea3
--- /dev/null
+++ b/generate_perfect_mock.py
@@ -0,0 +1,36 @@
+import pandas as pd
+
+# ساخت دیتای متنوع و واقع‌گرایانه برای ارضای محاسبات ماتریس و گراف
+data = {
+    'DB': ['OPENALEX', 'OPENALEX', 'OPENALEX', 'OPENALEX', 'OPENALEX'],
+    'UT': ['W1', 'W2', 'W3', 'W4', 'W5'],
+    'TI': ['Paper One', 'Paper Two', 'Paper Three', 'Paper Four', 'Paper Five'],
+    'SO': ['J SCI', 'J SCI', 'J INFO', 'J INFO', 'J SCI'],
+    'JI': ['J1', 'J2', 'J3', 'J4', 'J5'],
+    'PY': ['2021', '2022', '2023', '2024', '2025'],
+    'DT': ['ARTICLE', 'ARTICLE', 'ARTICLE', 'ARTICLE', 'ARTICLE'],
+    'LA': ['EN', 'EN', 'EN', 'EN', 'EN'],
+    'TC': ['10', '20', '30', '40', '50'],
+    'AU': ['SMITH J; DOE J', 'DOE J; NAZARI S', 'SMITH J; NAZARI S', 'WANG X; SMITH J', 'DOE J; WANG X'],
+    'AF': ['Smith, J; Doe, J', 'Doe, J; Nazari, S', 'Smith, J; Nazari, S', 'Wang, X; Smith, J', 'Doe, J; Wang, X'],
+    'C1': ['Univ Tehr, Tehran, Iran', 'Univ Tehr, Tehran, Iran', 'Sharif Univ, Tehran, Iran', 'Sharif Univ, Tehran, Iran', 'Univ Tehr, Tehran, Iran'],
+    # دادن مراجع مختلف به مقالات برای معنادار شدن محاسبات coupling map
+    'CR': [
+        'SMITH J, 2020, J SCI, V1, P1; DOE J, 2019, J SCI',
+        'DOE J, 2019, J SCI; NAZARI S, 2021, J SCI',
+        'SMITH J, 2020, J SCI, V1, P1; NAZARI S, 2021, J SCI',
+        'WANG X, 2018, J INFO; SMITH J, 2020, J SCI',
+        'DOE J, 2019, J SCI; WANG X, 2018, J INFO'
+    ],
+    'DE': ['ETL; PYTHON', 'PYTHON; SHINY', 'ETL; SHINY', 'BIBLIOMETRICS; ETL', 'BIBLIOMETRICS; PYTHON'],
+    'AB': ['Abstract 1', 'Abstract 2', 'Abstract 3', 'Abstract 4', 'Abstract 5'],
+    'VL': ['1', '2', '3', '4', '5'],
+    'BP': ['10', '20', '30', '40', '50'],
+    'EP': ['15', '25', '35', '45', '55'],
+    'SR': ['SMITH J, 2021', 'DOE J, 2022', 'SMITH J, 2023', 'WANG X, 2024', 'DOE J, 2025'],
+    'RP': ['SMITH J', 'DOE J', 'NAZARI S', 'WANG X', 'DOE J']
+}
+
+df = pd.DataFrame(data)
+df.to_csv('standardized_output.csv', index=False)
+print("✅ Standardized output updated with diverse academic network values!")
diff --git a/shiny_log.txt b/shiny_log.txt
new file mode 100644
index 000000000..eba9211c3
--- /dev/null
+++ b/shiny_log.txt
@@ -0,0 +1,10 @@
+INFO:     Will watch for changes in these directories: ['/Users/solmaznazari/Desktop/bibliometrix-python']
+/Users/solmaznazari/Desktop/bibliometrix-python/venv/lib/python3.14/site-packages/shiny/ui/_layout_columns.py:176: UserWarning: More column widths than children at breakpoint 'sm', extra widths will be ignored.
+  ret[brk] = validate_col_width(value, n_kids, brk)
+INFO:     Uvicorn running on http://127.0.0.1:8000 (Press CTRL+C to quit)
+INFO:     Started reloader process [28020] using WatchFiles
+/Users/solmaznazari/Desktop/bibliometrix-python/venv/lib/python3.14/site-packages/shiny/ui/_layout_columns.py:176: UserWarning: More column widths than children at breakpoint 'sm', extra widths will be ignored.
+  ret[brk] = validate_col_width(value, n_kids, brk)
+INFO:     Started server process [28037]
+INFO:     Waiting for application startup.
+INFO:     Application startup complete.
diff --git a/standardized_output.csv b/standardized_output.csv
new file mode 100644
index 000000000..55c7cc353
--- /dev/null
+++ b/standardized_output.csv
@@ -0,0 +1,51 @@
+DB,UT,DI,PMID,TI,SO,JI,J9,PY,DT,LA,TC,AU,AF,C1,RP,CR,DE,ID,AB,VL,IS,BP,EP,SR,AU_UN,AU1_CO,C3
+OPENALEX,https://openalex.org/W2101234009,10.48550/arxiv.1201.0490,,Scikit-learn: Machine Learning in Python,arXiv (Cornell University),,,2012,preprint,en,63727,"['Pedregosa F.', 'Varoquaux G.', 'Gramfort A.', 'Michel V.', 'Thirion B.', 'Grisel O.', 'Blondel M.', 'Andreas M.', 'Joel N.', 'Gilles L.', 'Prettenhofer P.', 'Weiss R.', 'Dubourg V.', 'Vanderplas J.', 'Passos A.', 'Cournapeau D.', 'Brucher M.', 'Perrot M.', 'Duchesnay É.']","['Fabián Pedregosa', 'Gaël Varoquaux', 'Alexandre Gramfort', 'Vincent Michel', 'Bertrand Thirion', 'Olivier Grisel', 'Mathieu Blondel', 'Müller, Andreas', 'Nothman, Joel', 'Louppe, Gilles', 'Peter Prettenhofer', 'Ron J. Weiss', 'Vincent Dubourg', 'Jake Vanderplas', 'Alexandre Passos', 'David Cournapeau', 'Matthieu Brucher', 'Matthieu Perrot', 'Édouard Duchesnay']","[""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'CEA Paris-Saclay', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'CEA Paris-Saclay', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'CEA Paris-Saclay', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'CEA Paris-Saclay', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'CEA Paris-Saclay', 'Nuxe (France)', 'Kobe University', 'Bauhaus-Universität Weimar', 'Google (Canada)', 'University of Washington', 'Amherst College', 'University of Massachusetts Amherst', 'Enthought (United States)', 'Total (France)']",,"['W1496508106', 'W1571024744', 'W2024933578', 'W2035776949', 'W2040387238', 'W2047804403', 'W2063978378', 'W2097360283', 'W2097850441', 'W2118585731', 'W2146292423', 'W2152799677', 'W2153635508']","['Python (programming language)', 'Documentation', 'Computer science', 'MIT License', 'Artificial intelligence', 'Machine learning', 'Programming language', 'License', 'Software engineering', 'Operating system']","['Python (programming language)', 'Documentation', 'Computer science', 'MIT License', 'Artificial intelligence', 'Machine learning', 'Programming language', 'License', 'Software engineering', 'Operating system']",,,,,,Pedregosa 2012 arXiv VV0,Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Nuxe (France);Kobe University;Bauhaus-Universität Weimar;Google (Canada);University of Washington;Amherst College;University of Massachusetts Amherst;Enthought (United States);Total (France),Commissariat à l'Énergie Atomique et aux Énergies Alternatives,Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Nuxe (France);Kobe University;Bauhaus-Universität Weimar;Google (Canada);University of Washington;Amherst College;University of Massachusetts Amherst;Enthought (United States);Total (France)
+OPENALEX,https://openalex.org/W3023540311,10.5860/choice.27-0936,,"Genetic algorithms in search, optimization, and machine learning",Choice Reviews Online,,,1989,article,en,49334,[],[],[],,[],"['Computer science', 'Artificial intelligence', 'Machine learning', 'Quality control and genetic algorithms', 'Algorithm', 'Genetic algorithm', 'Meta-optimization']","['Computer science', 'Artificial intelligence', 'Machine learning', 'Quality control and genetic algorithms', 'Algorithm', 'Genetic algorithm', 'Meta-optimization']",,27,02,27,0936,UNKNOWN 1989 Choice V27,,,
+OPENALEX,https://openalex.org/W2125055259,,,C4.5: Programs for Machine Learning,,,,1992,book,en,23698,['Quinlan J.'],['J. R. Quinlan'],['University of Sydney'],,[],"['Computer science', 'Unix', 'Classifier (UML)', 'Machine learning', 'Artificial intelligence', 'Source code', 'Workstation', 'Software', 'Decision tree', 'Sample (material)', 'Software engineering', 'Data mining', 'Programming language', 'Operating system']","['Computer science', 'Unix', 'Classifier (UML)', 'Machine learning', 'Artificial intelligence', 'Source code', 'Workstation', 'Software', 'Decision tree', 'Sample (material)', 'Software engineering', 'Data mining', 'Programming language', 'Operating system', 'Chromatography', 'Chemistry']",,,,,,Quinlan 1992 UNKNOWNJ VV0,University of Sydney,University of Sydney,University of Sydney
+OPENALEX,https://openalex.org/W3120740533,,,UCI Machine Learning Repository,Medical Entomology and Zoology,,,2007,article,en,24350,['Asuncion A.'],['Arthur Asuncion'],[],,[],"['Computer science', 'Artificial intelligence']","['Computer science', 'Artificial intelligence']",,,,,,Asuncion 2007 Medical VV0,,,
+OPENALEX,https://openalex.org/W1570448133,10.1016/c2009-0-19715-5,,Data Mining: Practical Machine Learning Tools and Techniques,Elsevier eBooks,,,2011,book,en,25713,"['Witten I.', 'Frank E.', 'Hall M.']","['Ian H. Witten', 'Eibe Frank', 'Mark A. Hall']",[],,"['W23418094', 'W24402856', 'W28412257', 'W43179442', 'W64096637', 'W66926763', 'W69783631', 'W122789262', 'W123339444', 'W138217685', 'W149472151', 'W173229765', 'W187357405', 'W586094522', 'W589058777', 'W1483135265', 'W1483679765', 'W1492324553', 'W1492698999', 'W1495859460', 'W1500698297', 'W1506285740', 'W1513366687', 'W1516443426', 'W1520687314', 'W1523856491', 'W1524704912', 'W1528113134', 'W1530010412', 'W1533544838', 'W1533946607', 'W1536719366', 'W1550206324', 'W1550821944', 'W1551066950', 'W1553019137', 'W1553313034', 'W1554663460', 'W1555244713', 'W1559060276', 'W1560107318', 'W1563088657', 'W1564947197', 'W1571836963', 'W1572964175', 'W1572978214', 'W1573228426', 'W1576962511', 'W1582036668', 'W1583700199', 'W1584333058', 'W1585221258', 'W1585610988', 'W1585743408', 'W1588100052', 'W1588282782', 'W1597165973', 'W1598333443', 'W1598696986', 'W1600437712', 'W1601529450', 'W1604345466', 'W1605275907', 'W1605688901', 'W1605957858', 'W1619226191', 'W1625504505', 'W1630964756', 'W1641039719', 'W1648885110', 'W1670263352', 'W1673310716', 'W1676820704', 'W1678889691', 'W1679846099', 'W1680392829', 'W1763728792', 'W1781794689', 'W1800049145', 'W1806329564', 'W1817561967', 'W1833977909', 'W1861764418', 'W1881647329', 'W1882120692', 'W1906182963', 'W1907578970', 'W1908888846', 'W1912123407', 'W1932571505', 'W1955600018', 'W1969482724', 'W1978515644', 'W1979711143', 'W1982161962', 'W1985593448', 'W1987947967', 'W1990748933', 'W1995945562', 'W2001619934', 'W2008906462', 'W2014725748', 'W2015401436', 'W2017337590', 'W2019575783', 'W2024046085', 'W2024646871', 'W2024668293', 'W2035890032', 'W2037603696', 'W2037768235', 'W2037965136', 'W2042385018', 'W2048679005', 'W2053154970', 'W2057720927', 'W2058732827', 'W2064853889', 'W2065861851', 'W2066636486', 'W2067098334', 'W2068337856', 'W2073308541', 'W2073583237', 'W2074610805', 'W2075665712', 'W2078579128', 'W2095749253', 'W2095897464', 'W2097089247', 'W2097569937', 'W2100406636', 'W2102009083', 'W2105494575', 'W2105497548', 'W2106393550', 'W2108949035', 'W2110119381', 'W2111746072', 'W2112076978', 'W2112841646', 'W2113242816', 'W2117812871', 'W2118020653', 'W2118383892', 'W2119821739', 'W2119885577', 'W2120216197', 'W2122111042', 'W2122410182', 'W2129113961', 'W2129249398', 'W2132166479', 'W2133632100', 'W2134696506', 'W2138064700', 'W2138621811', 'W2139059214', 'W2140190241', 'W2142767931', 'W2142819948', 'W2142957916', 'W2143349571', 'W2143426320', 'W2144907232', 'W2146257637', 'W2147492008', 'W2147810216', 'W2148949939', 'W2149706766', 'W2153028052', 'W2154318594', 'W2154642793', 'W2156909104', 'W2160642098', 'W2161077873', 'W2163915185', 'W2164818318', 'W2166559705', 'W2167793421', 'W2170112109', 'W2170654002', 'W2170726034', 'W2170913656', 'W2172162418', 'W2172780573', 'W2277957941', 'W2331052961', 'W2621280964', 'W2912934387', 'W2913066018', 'W2914369697', 'W2953014340', 'W2988864014', 'W3017143921', 'W3023540311', 'W3083113686', 'W3085162807', 'W3123294050', 'W3163638146', 'W3193477162', 'W3203633735', 'W3208887124']","['Computer science', 'Machine learning', 'Data science', 'Data mining', 'Artificial intelligence']","['Computer science', 'Machine learning', 'Data science', 'Data mining', 'Artificial intelligence']",,,,,,Witten 2011 Elsevier VV0,,,
+OPENALEX,https://openalex.org/W1663973292,10.1117/1.2819119,,Pattern Recognition and Machine Learning,Journal of Electronic Imaging,,,2007,article,en,22083,['Nasrabadi N.'],['Nasser M. Nasrabadi'],"['West Virginia University', 'Microsoft Research (United Kingdom)']",,"['W1480376833', 'W1496317909', 'W2117812871', 'W3215037115', 'W4232383088', 'W4292691288']","['Computer science', 'Imaging science', 'Cover (algebra)', 'Data science', 'Artificial intelligence', 'Engineering']","['Computer science', 'Imaging science', 'Cover (algebra)', 'Data science', 'Artificial intelligence', 'Engineering', 'Mechanical engineering']",,16,4,049901,049901,Nasrabadi 2007 Journal V16,West Virginia University;Microsoft Research (United Kingdom),West Virginia University,West Virginia University;Microsoft Research (United Kingdom)
+OPENALEX,https://openalex.org/W1639032689,,,"Genetic Algorithms in Search, Optimization and Machine Learning",,,,1988,book,en,17771,"['Goldberg D.', 'Robson D.']","['David E. Goldberg', 'David Robson']",[],,[],"['Pascal (unit)', 'Computer science', 'Genetic programming', 'Genetic algorithm', 'Machine learning', 'Artificial intelligence', 'Quality control and genetic algorithms', 'Theoretical computer science', 'Algorithm', 'Programming language', 'Meta-optimization']","['Pascal (unit)', 'Computer science', 'Genetic programming', 'Genetic algorithm', 'Machine learning', 'Artificial intelligence', 'Quality control and genetic algorithms', 'Theoretical computer science', 'Algorithm', 'Programming language', 'Meta-optimization']",,,,,,Goldberg 1988 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W1583837637,10.1145/1273496,,Proceedings of the 24th international conference on Machine learning,,,,2007,preprint,en,11734,[],[],[],,[],"['Presentation (obstetrics)', 'Library science', 'Computer science', 'Medical education', 'Medicine']","['Presentation (obstetrics)', 'Library science', 'Computer science', 'Medical education', 'Medicine', 'Radiology']",,,,,,UNKNOWN 2007 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W1746819321,10.7551/mitpress/3206.001.0001,,Gaussian Processes for Machine Learning,The MIT Press eBooks,,,2005,book,en,10489,"['Rasmussen C.', 'Williams C.']","['Carl Edward Rasmussen', 'Christopher K. I. Williams']","['Max Planck Society', 'Max Planck Institute for Biological Cybernetics']",,"['W14377099', 'W44447720', 'W61071295', 'W131514509', 'W186419298', 'W336602872', 'W1213006044', 'W1484867920', 'W1486089539', 'W1486164486', 'W1496317909', 'W1497675750', 'W1505043854', 'W1506153731', 'W1510355813', 'W1512098439', 'W1512149552', 'W1515272691', 'W1543996294', 'W1549258098', 'W1550570395', 'W1551209770', 'W1554663460', 'W1564947197', 'W1567512734', 'W1571894236', 'W1574225613', 'W1598589417', 'W1601740268', 'W1604293137', 'W1607751291', 'W1618393386', 'W1618449801', 'W1628829797', 'W1633751774', 'W1642427530', 'W1648445109', 'W1654787807', 'W1755117326', 'W1859781365', 'W1963533512', 'W1965999112', 'W1967396577', 'W1975780894', 'W1976382401', 'W1976625337', 'W1978188282', 'W1978394996', 'W1981025032', 'W1982032418', 'W1982276155', 'W1986280275', 'W1995672551', 'W1998167411', 'W2000241167', 'W2003706076', 'W2003870625', 'W2006314423', 'W2008827410', 'W2014831690', 'W2015904350', 'W2018044188', 'W2019363670', 'W2020999234', 'W2023163512', 'W2033839039', 'W2041863660', 'W2047028564', 'W2049387919', 'W2056735347', 'W2062291655', 'W2063852603', 'W2065540158', 'W2069371995', 'W2069527924', 'W2072555316', 'W2078206416', 'W2081873601', 'W2085877024', 'W2087978636', 'W2088538739', 'W2090102379', 'W2090353374', 'W2093268114', 'W2094169479', 'W2094212611', 'W2096335861', 'W2098115979', 'W2098626000', 'W2098949458', 'W2100136038', 'W2101709642', 'W2103972570', 'W2104533781', 'W2106868411', 'W2107152312', 'W2107636931', 'W2107725114', 'W2108966602', 'W2111176881', 'W2111494971', 'W2112545207', 'W2114229504', 'W2114412769', 'W2115606304', 'W2116723448', 'W2117063635', 'W2117812871', 'W2118195892', 'W2123687908', 'W2124101779', 'W2124225821', 'W2126455177', 'W2127713198', 'W2129564505', 'W2129869373', 'W2130475491', 'W2130859329', 'W2137467792', 'W2137557016', 'W2137956165', 'W2139479120', 'W2140170995', 'W2140251433', 'W2141274633', 'W2141436719', 'W2142182841', 'W2142387771', 'W2142575165', 'W2143022286', 'W2143956139', 'W2144286620', 'W2145295623', 'W2146766088', 'W2148603752', 'W2149417376', 'W2149846618', 'W2151238122', 'W2152701363', 'W2152937653', 'W2153347097', 'W2153756422', 'W2156909104', 'W2158451137', 'W2158529569', 'W2160840682', 'W2161767008', 'W2162114812', 'W2163057507', 'W2167061265', 'W2167986580', 'W2168022998', 'W2169779569', 'W2170076406', 'W2170078560', 'W2170120409', 'W2170334710', 'W2171522835', 'W2172039283', 'W2296319761', 'W2408196097', 'W2464224693', 'W2548695521', 'W2554813760', 'W2782810849', 'W2797583072', 'W2798909945', 'W2904816695', 'W2916304084', 'W2989448192', 'W3014600732', 'W3017143921', 'W3023786531', 'W3048078645', 'W3119264854', 'W3127325877', 'W3134067276', 'W3140968660', 'W3148924112', 'W3165771198']","['Machine learning', 'Artificial intelligence', 'Computer science', 'Online machine learning', 'Gaussian process', 'Probabilistic logic', 'Relevance vector machine', 'Support vector machine', 'Kernel method', 'Artificial neural network', 'Gaussian']","['Machine learning', 'Artificial intelligence', 'Computer science', 'Online machine learning', 'Gaussian process', 'Probabilistic logic', 'Relevance vector machine', 'Support vector machine', 'Kernel method', 'Artificial neural network', 'Gaussian', 'Quantum mechanics', 'Physics']",,,,,,Rasmussen 2005 The VV0,Max Planck Society;Max Planck Institute for Biological Cybernetics,Max Planck Society,Max Planck Society;Max Planck Institute for Biological Cybernetics
+OPENALEX,https://openalex.org/W1503398984,,,Machine learning a probabilistic perspective,,,,2012,book,en,9328,['Murphy K.'],['Kevin P. Murphy'],[],,[],"['Computer science', 'Probabilistic logic', 'Artificial intelligence', 'Field (mathematics)', 'Conditional random field', 'Heuristic', 'Machine learning', 'Graphical model', 'Regularization (linguistics)', 'Software', 'Programming language']","['Computer science', 'Probabilistic logic', 'Artificial intelligence', 'Field (mathematics)', 'Conditional random field', 'Heuristic', 'Machine learning', 'Graphical model', 'Regularization (linguistics)', 'Software', 'Programming language', 'Pure mathematics', 'Mathematics']",,,,,,Murphy 2012 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W1901616594,10.1126/science.aaa8415,26185243,"Machine learning: Trends, perspectives, and prospects",Science,,,2015,review,en,9553,"['Jordan M.', 'Mitchell T.']","['Michael I. Jordan', 'Tom M. Mitchell']","['University of California, Berkeley', 'Carnegie Mellon University']",,"['W99485931', 'W1503398984', 'W1512585804', 'W1554944419', 'W1569098853', 'W1873763122', 'W1970472910', 'W1992570774', 'W1999352252', 'W2006452405', 'W2019363670', 'W2042469398', 'W2047281923', 'W2076063813', 'W2097381042', 'W2100495367', 'W2117726420', 'W2127180992', 'W2132001804', 'W2145339207', 'W2146774335', 'W2151320232', 'W2160815625', 'W2163605009', 'W2174706414', 'W2618530766', 'W3102480238', 'W4214717370', 'W4231109964', 'W4238893454', 'W4244670803', 'W4292363360']","['Intersection (aeronautics)', 'Computer science', 'Artificial intelligence', 'Core (optical fiber)', 'Data science', 'Machine learning', 'Big data', 'Computation', 'Lying', 'Engineering', 'Data mining']","['Intersection (aeronautics)', 'Computer science', 'Artificial intelligence', 'Core (optical fiber)', 'Data science', 'Machine learning', 'Big data', 'Computation', 'Lying', 'Engineering', 'Data mining', 'Aerospace engineering', 'Radiology', 'Telecommunications', 'Medicine', 'Algorithm']",,349,6245,255,260,Jordan 2015 Science V349,"University of California, Berkeley;Carnegie Mellon University",Berkeley,"University of California, Berkeley;Carnegie Mellon University"
+OPENALEX,https://openalex.org/W4212863985,10.1007/978-0-387-45528-0,,Pattern Recognition and Machine Learning,,,,2006,book,en,9861,[],[],[],,[],"['Computer science', 'Artificial intelligence', 'Pattern recognition (psychology)']","['Computer science', 'Artificial intelligence', 'Pattern recognition (psychology)']",,,,,,UNKNOWN 2006 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W2084812512,,,UCI Repository of machine learning databases,Medical Entomology and Zoology,,,1998,article,en,10547,['Blake C.'],['Catherine Blake'],[],,[],"['Computer science', 'Database', 'Artificial intelligence']","['Computer science', 'Database', 'Artificial intelligence']",,,,,,Blake 1998 Medical VV0,,,
+OPENALEX,https://openalex.org/W2997591727,10.5555/1953048.2078195,,Scikit-learn: Machine Learning in Python,Journal of Machine Learning Research,,,2011,article,en,8216,"['PedregosaFabian', 'VaroquauxGaël', 'GramfortAlexandre', 'MichelVincent', 'ThirionBertrand', 'GriselOlivier', 'BlondelMathieu', 'PrettenhoferPeter', 'WeissRon', 'DubourgVincent', 'VanderplasJake', 'PassosAlexandre', 'CournapeauDavid', 'BrucherMatthieu', 'PerrotMatthieu', 'DuchesnayÉdouard']","['PedregosaFabian', 'VaroquauxGaël', 'GramfortAlexandre', 'MichelVincent', 'ThirionBertrand', 'GriselOlivier', 'BlondelMathieu', 'PrettenhoferPeter', 'WeissRon', 'DubourgVincent', 'VanderplasJake', 'PassosAlexandre', 'CournapeauDavid', 'BrucherMatthieu', 'PerrotMatthieu', 'DuchesnayÉdouard']",[],,[],"['Python (programming language)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Programming language']","['Python (programming language)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Programming language']",,,,,,PedregosaFabian 2011 Journal VV0,,,
+OPENALEX,https://openalex.org/W2953384591,10.48550/arxiv.1605.08695,,TensorFlow: A system for large-scale machine learning,arXiv (Cornell University),,,2016,preprint,en,8823,"['Abadi M.', 'Barham P.', 'Chen J.', 'Chen Z.', 'Davis A.', 'Dean J.', 'Devin M.', 'Ghemawat S.', 'Irving G.', 'Isard M.', 'Kudlur M.', 'Levenberg J.', 'Monga R.', 'Moore S.', 'Murray D.', 'Steiner B.', 'Tucker P.', 'Vasudevan V.', 'Warden P.', 'Wicke M.', 'Yu Y.', 'Zheng X.']","['Martı́n Abadi', 'Paul Barham', 'Jianmin Chen', 'Zhifeng Chen', 'Andy Davis', 'Jay B. Dean', 'Matthieu Devin', 'Sanjay Ghemawat', 'Geoffrey Irving', 'Michael Isard', 'Manjunath Kudlur', 'Josh Levenberg', 'Rajat Monga', 'Sherry Moore', 'Derek G. Murray', 'Benoit Steiner', 'Paul A. Tucker', 'Vijay Vasudevan', 'Pete Warden', 'Martin Wicke', 'Yuan Yu', 'Xiaoqiang Zheng']","['Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)']",,"['W104184427', 'W145476170', 'W941230081', 'W1442374986', 'W1484210532', 'W1485981043', 'W1493893823', 'W1498436455', 'W1548328233', 'W1598866093', 'W1658008008', 'W1667652561', 'W1869752048', 'W1978660892', 'W1992479210', 'W2041517243', 'W2055312318', 'W2061570747', 'W2066443755', 'W2072566913', 'W2083842231', 'W2099471712', 'W2100664567', 'W2109722477', 'W2117539524', 'W2120480077', 'W2131400476', 'W2131975293', 'W2132339004', 'W2140833774', 'W2141992894', 'W2145339207', 'W2146757372', 'W2160815625', 'W2163961697', 'W2168231600', 'W2173213060', 'W2186615578', 'W2198403777', 'W2259472270', 'W2308045930', 'W2336650964', 'W2339765813', 'W2384495648', 'W2591588155', 'W2949117887', 'W2949245006', 'W2949501655', 'W2949605076', 'W2949650786', 'W2949888546', 'W2950094539', 'W2950179405', 'W2950577311', 'W2951714314', 'W2951781666']","['Scale (ratio)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Cartography', 'Geography']","['Scale (ratio)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Cartography', 'Geography']",,,,,,Abadi 2016 arXiv VV0,Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States),Google (United States),Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States)
+OPENALEX,https://openalex.org/W2118020653,10.1145/505282.505283,,Machine learning in automated text categorization,ACM Computing Surveys,,,2002,review,en,7890,['Sebastiani F.'],['Fabrizio Sebastiani'],['Consorzio Pisa Ricerche'],,"['W12876238', 'W22906612', 'W35304842', 'W59979790', 'W74894479', 'W81384683', 'W81511778', 'W104970664', 'W107306860', 'W112196149', 'W116328816', 'W148103248', 'W166124110', 'W1482260847', 'W1487445520', 'W1490175418', 'W1493526108', 'W1505794130', 'W1507179106', 'W1508175965', 'W1513874326', 'W1514707997', 'W1520963883', 'W1522930027', 'W1523389133', 'W1523949738', 'W1533946607', 'W1544227718', 'W1547553618', 'W1550961891', 'W1553682320', 'W1556094091', 'W1561056154', 'W1574901103', 'W1576676390', 'W1577216492', 'W1578881253', 'W1591234214', 'W1592212241', 'W1594962278', 'W1597379537', 'W1601145406', 'W1619226191', 'W1620204465', 'W1813610639', 'W1857571498', 'W1907380269', 'W1924689489', 'W1966065191', 'W1969572066', 'W1970858159', 'W1970974276', 'W1971666241', 'W1973911615', 'W1975496312', 'W1977182536', 'W1978394996', 'W1979648751', 'W1980776671', 'W1983078185', 'W1986913017', 'W1988711048', 'W1989568037', 'W1989738209', 'W1993657037', 'W1993934121', 'W1995014490', 'W2001664274', 'W2002675557', 'W2002857471', 'W2003436527', 'W2004180556', 'W2004871537', 'W2005422315', 'W2005758492', 'W2006119904', 'W2006187024', 'W2007395264', 'W2007512902', 'W2008931716', 'W2009190245', 'W2010652031', 'W2013657661', 'W2015267443', 'W2015518873', 'W2017867386', 'W2019778169', 'W2020316999', 'W2025451713', 'W2029609769', 'W2033751006', 'W2035754578', 'W2040424159', 'W2041726831', 'W2043909051', 'W2045812729', 'W2047031127', 'W2049384587', 'W2053463056', 'W2058982198', 'W2059019405', 'W2060216474', 'W2060476676', 'W2060704583', 'W2062847911', 'W2062914707', 'W2063198646', 'W2063862666', 'W2064580901', 'W2065010255', 'W2065747622', 'W2066462377', 'W2071415686', 'W2071664212', 'W2076008912', 'W2077777431', 'W2080251601', 'W2084044465', 'W2085302848', 'W2085989833', 'W2087609354', 'W2088658068', 'W2092134162', 'W2092488901', 'W2092689128', 'W2093098531', 'W2094934653', 'W2096152098', 'W2096411881', 'W2097089247', 'W2097847889', 'W2101154521', 'W2104808840', 'W2106365165', 'W2107008379', 'W2107827038', 'W2110224739', 'W2114535528', 'W2125776553', 'W2126502509', 'W2126631147', 'W2126850915', 'W2127994451', 'W2130337399', 'W2132315067', 'W2133890944', 'W2135276756', 'W2139578439', 'W2140785063', 'W2140956226', 'W2142515059', 'W2145036943', 'W2145296344', 'W2146888100', 'W2147152072', 'W2149684865', 'W2151801809', 'W2153211312', 'W2153962014', 'W2158738673', 'W2165612380', 'W2169384781', 'W2170654002', 'W2172142456', 'W2174678383', 'W2435251607', 'W2561675875', 'W2798573942', 'W2915186198', 'W2949696181', 'W2952299822', 'W2953123431', 'W3042893949', 'W3157411736', 'W4205241946', 'W4240008182', 'W4249379282', 'W4285719527', 'W6604296810', 'W6614676750', 'W6629232668', 'W6630268012', 'W6631307659', 'W6632118081', 'W6633640926', 'W6635379667', 'W6635548358', 'W6636628491', 'W6638423001', 'W6641777427', 'W6643036076', 'W6644484350', 'W6666817399', 'W6673691841', 'W6673781366', 'W6679004887', 'W6679453733', 'W6681835404', 'W6682342947', 'W6738852829', 'W6792154874', 'W6794861161', 'W7046466245', 'W7064660697']","['Computer science', 'Categorization', 'Software portability', 'Artificial intelligence', 'Classifier (UML)', 'Machine learning', 'Text categorization', 'Natural language processing']","['Computer science', 'Categorization', 'Software portability', 'Artificial intelligence', 'Classifier (UML)', 'Machine learning', 'Text categorization', 'Natural language processing', 'Programming language']",,34,1,1,47,Sebastiani 2002 ACM V34,Consorzio Pisa Ricerche,Consorzio Pisa Ricerche,Consorzio Pisa Ricerche
+OPENALEX,https://openalex.org/W1504694836,,,Programs for Machine Learning,,,,1994,article,en,5804,"['Salzberg S.', 'Segre A.']","['Steven L. Salzberg', 'Alberto M. Segre']",['Johns Hopkins University'],,"['W1534707631', 'W1573640198', 'W1594031697', 'W1604329830', 'W2149706766', 'W3085162807']","['Successor cardinal', 'Artificial intelligence', 'Computer science', 'Decision tree', 'Machine learning', 'Subject (documents)', 'ID3 algorithm', 'Decision tree learning', 'Incremental decision tree', 'World Wide Web', 'Mathematics']","['Successor cardinal', 'Artificial intelligence', 'Computer science', 'Decision tree', 'Machine learning', 'Subject (documents)', 'ID3 algorithm', 'Decision tree learning', 'Incremental decision tree', 'World Wide Web', 'Mathematics', 'Mathematical analysis']",,,,,,Salzberg 1994 UNKNOWNJ VV0,Johns Hopkins University,Johns Hopkins University,Johns Hopkins University
+OPENALEX,https://openalex.org/W1601795611,10.1108/03684920710743466,,Pattern Recognition and Machine Learning,Kybernetes,,,2007,article,en,8434,[],[],[],,[],"['Computer science', 'Cybernetics', 'Artificial intelligence', 'Machine learning']","['Computer science', 'Cybernetics', 'Artificial intelligence', 'Machine learning']",,36,2,275,275,UNKNOWN 2007 Kybernetes V36,,,
+OPENALEX,https://openalex.org/W2271840356,10.48550/arxiv.1603.04467,,TensorFlow: Large-Scale Machine Learning on Heterogeneous Distributed Systems,arXiv (Cornell University),,,2016,preprint,en,9777,"['Abadi M.', 'Agarwal A.', 'Barham P.', 'Brevdo E.', 'Chen Z.', 'Citro C.', 'Corrado G.', 'Davis A.', 'Dean J.', 'Devin M.', 'Ghemawat S.', 'Goodfellow I.', 'Harp A.', 'Irving G.', 'Isard M.', 'Jia Y.', 'Józefowicz R.', 'Kaiser Ł.', 'Kudlur M.', 'Levenberg J.', 'Mané D.', 'Monga R.', 'Moore S.', 'Murray D.', 'Olah C.', 'Schuster M.', 'Shlens J.', 'Steiner B.', 'Sutskever I.', 'Talwar K.', 'Tucker P.', 'Vanhoucke V.', 'Vasudevan V.', 'Viégas F.', 'Vinyals O.', 'Warden P.', 'Wattenberg M.', 'Wicke M.', 'Yu Y.', 'Zheng X.']","['Martı́n Abadi', 'Ashish Agarwal', 'Paul Barham', 'Eugene Brevdo', 'Zhifeng Chen', 'Craig Citro', 'Gregory S. Corrado', 'Andy Davis', 'Jay B. Dean', 'Matthieu Devin', 'Sanjay Ghemawat', 'Ian Goodfellow', 'Andrew Harp', 'Geoffrey Irving', 'Michael Isard', 'Yangqing Jia', 'Rafał Józefowicz', 'Łukasz Kaiser', 'Manjunath Kudlur', 'Josh Levenberg', 'Dan Mané', 'Rajat Monga', 'Sherry Moore', 'Derek G. Murray', 'Chris Olah', 'Mike Schuster', 'Jonathon Shlens', 'Benoit Steiner', 'Ilya Sutskever', 'Kunal Talwar', 'Paul A. Tucker', 'Vincent Vanhoucke', 'Vijay Vasudevan', 'Fernanda Viégas', 'Oriol Vinyals', 'Pete Warden', 'Martin Wattenberg', 'Martin Wicke', 'Yuan Yu', 'Xiaoqiang Zheng']",[],,"['W1442374986', 'W1484210532', 'W1487337216', 'W1498436455', 'W1526734559', 'W1548328233', 'W1598866093', 'W1614298861', 'W1658008008', 'W1667652561', 'W1738019091', 'W1827297289', 'W1869752048', 'W1947291763', 'W1978660892', 'W1978924650', 'W2002257715', 'W2016053056', 'W2017351599', 'W2032036568', 'W2035424729', 'W2055312318', 'W2064675550', 'W2082171780', 'W2097117768', 'W2100830825', 'W2123024445', 'W2130942839', 'W2131975293', 'W2138243089', 'W2141992894', 'W2146757372', 'W2155893237', 'W2160815625', 'W2168231600', 'W2171532807', 'W2181607856', 'W2253807446', 'W2507756961', 'W2949117887', 'W2950789693', 'W2951781666']","['Scale (ratio)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Distributed computing', 'Geography', 'Cartography']","['Scale (ratio)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Distributed computing', 'Geography', 'Cartography']",,,,,,Abadi 2016 arXiv VV0,,,
+OPENALEX,https://openalex.org/W3163993681,10.1038/s42254-021-00314-5,,Physics-informed machine learning,Nature Reviews Physics,,,2021,review,en,6522,"['Karniadakis G.', 'Kevrekidis I.', 'Lu L.', 'Perdikaris P.', 'Wang S.', 'Yang L.']","['George Em Karniadakis', 'Ioannis G. Kevrekidis', 'Lu Lu', 'Paris Perdikaris', 'Sifan Wang', 'Liu Yang']","['Brown University', 'Johns Hopkins University', 'Massachusetts Institute of Technology', 'University of Pennsylvania', 'Applied Mathematics (United States)', 'University of Pennsylvania', 'Brown University']",,"['W196871588', 'W1538131130', 'W1543241987', 'W1731081199', 'W1856502440', 'W1899249567', 'W1972005403', 'W1972576201', 'W1976068300', 'W1979769287', 'W2000359198', 'W2002355073', 'W2017880874', 'W2018159038', 'W2019465613', 'W2020561998', 'W2025444507', 'W2060229389', 'W2072072671', 'W2099471712', 'W2101371964', 'W2125645174', 'W2134164499', 'W2142894919', 'W2143225719', 'W2149498546', 'W2158985775', 'W2194775991', 'W2212370034', 'W2234882433', 'W2239232218', 'W2261689926', 'W2277172374', 'W2323851192', 'W2402144811', 'W2474090883', 'W2486824498', 'W2507348356', 'W2534240011', 'W2550848904', 'W2551156993', 'W2558748708', 'W2573864470', 'W2600297185', 'W2605147767', 'W2619381903', 'W2742127985', 'W2749028154', 'W2777417212', 'W2783378529', 'W2786232134', 'W2787931125', 'W2803629276', 'W2809090039', 'W2810026216', 'W2811199191', 'W2856628251', 'W2884775584', 'W2886802770', 'W2887569307', 'W2890889625', 'W2890968382', 'W2893749619', 'W2893813411', 'W2896549049', 'W2897097528', 'W2899283552', 'W2899971035', 'W2900369848', 'W2901203181', 'W2907047316', 'W2908541468', 'W2909320927', 'W2912389156', 'W2912465314', 'W2912649832', 'W2913323966', 'W2914483840', 'W2914520121', 'W2919958648', 'W2936357167', 'W2945102878', 'W2946794331', 'W2946866513', 'W2947072793', 'W2951392159', 'W2952046647', 'W2959995783', 'W2962793481', 'W2963021886', 'W2963063862', 'W2963095610', 'W2963190151', 'W2963518130', 'W2963634130', 'W2963716063', 'W2963755523', 'W2963901342', 'W2964059111', 'W2964088238', 'W2964121744', 'W2964135722', 'W2964212578', 'W2964268978', 'W2966284335', 'W2969381807', 'W2970100546', 'W2970971581', 'W2971095480', 'W2971343405', 'W2972153210', 'W2973886134', 'W2975003945', 'W2977109506', 'W2978281981', 'W2979712029', 'W2979786244', 'W2980147119', 'W2980592884', 'W2980973551', 'W2983902802', 'W2991298115', 'W2991550674', 'W2994626356', 'W2994747787', 'W2997814214', 'W2999026783', 'W2999467285', 'W3003747211', 'W3003922491', 'W3004450693', 'W3005610174', 'W3007470329', 'W3007740214', 'W3008453832', 'W3009784374', 'W3010849941', 'W3011147100', 'W3011806874', 'W3012417314', 'W3012621877', 'W3014009018', 'W3014468003', 'W3015176898', 'W3015606043', 'W3015865829', 'W3016703299', 'W3022657828', 'W3023982288', 'W3025645353', 'W3026222427', 'W3028316595', 'W3028529071', 'W3035493266', 'W3036843665', 'W3037090957', 'W3039304986', 'W3040277050', 'W3041984619', 'W3043174105', 'W3043516796', 'W3045146186', 'W3046173836', 'W3047001618', 'W3048241795', 'W3049075514', 'W3080393992', 'W3081814969', 'W3082908155', 'W3082977546', 'W3084017095', 'W3088681382', 'W3088691598', 'W3088877001', 'W3093018961', 'W3093190107', 'W3093786597', 'W3093990252', 'W3096173239', 'W3096732413', 'W3098172061', 'W3098195931', 'W3098370560', 'W3098546160', 'W3098951945', 'W3099849883', 'W3100156752', 'W3101260193', 'W3101396145', 'W3102139197', 'W3102569296', 'W3102697518', 'W3102845444', 'W3102921872', 'W3103242287', 'W3104150464', 'W3104873019', 'W3105982350', 'W3106050203', 'W3107691001', 'W3107973042', 'W3112233611', 'W3112264320', 'W3116268267', 'W3118310857', 'W3125167458', 'W3128400532', 'W3129530645', 'W3129610195', 'W3132277775', 'W3133338006', 'W3133608513', 'W3137240924', 'W3137474564', 'W3138463430', 'W3145000844', 'W3148629269', 'W3168386838', 'W3181271387', 'W3201460085', 'W3207890637', 'W4230953281', 'W4234008654', 'W6694756022', 'W6713134421', 'W6755308174', 'W6763197053', 'W6787451610']","['Computer science', 'Artificial intelligence', 'Machine learning', 'Multiphysics', 'Inference', 'Artificial neural network', 'Physical law', 'Field (mathematics)', 'Discretization', 'Kernel method', 'Deep learning', 'Theoretical computer science', 'Mathematics', 'Support vector machine', 'Finite element method']","['Computer science', 'Artificial intelligence', 'Machine learning', 'Multiphysics', 'Inference', 'Artificial neural network', 'Physical law', 'Field (mathematics)', 'Discretization', 'Kernel method', 'Deep learning', 'Theoretical computer science', 'Mathematics', 'Support vector machine', 'Finite element method', 'Mathematical analysis', 'Philosophy', 'Pure mathematics', 'Physics', 'Epistemology', 'Thermodynamics']",,3,6,422,440,Karniadakis 2021 Nature V3,Brown University;Johns Hopkins University;Massachusetts Institute of Technology;University of Pennsylvania;Applied Mathematics (United States);University of Pennsylvania;Brown University,Brown University,Brown University;Johns Hopkins University;Massachusetts Institute of Technology;University of Pennsylvania;Applied Mathematics (United States);University of Pennsylvania;Brown University
+OPENALEX,https://openalex.org/W1534477342,10.1007/3-540-45014-9_1,,Ensemble Methods in Machine Learning,Lecture notes in computer science,,,2000,book-chapter,en,7840,['Dietterich T.'],['Thomas G. Dietterich'],['Oregon State University'],,"['W195465510', 'W1482451543', 'W1553313034', 'W1578772208', 'W1605688901', 'W1676820704', 'W1970074386', 'W1988790447', 'W1991418450', 'W2019778169', 'W2027197837', 'W2032210760', 'W2037699108', 'W2042614373', 'W2098191394', 'W2112076978', 'W2135293965', 'W2148520070', 'W2152761983', 'W2912934387', 'W2914859268', 'W4212774754', 'W4242746271', 'W6676769703', 'W6808111085']","['Computer science', 'Overfitting', 'Ensemble learning', 'Boosting (machine learning)', 'AdaBoost', 'Artificial intelligence', 'Machine learning', 'Classifier (UML)', 'Bayesian probability', 'Pattern recognition (psychology)', 'Artificial neural network']","['Computer science', 'Overfitting', 'Ensemble learning', 'Boosting (machine learning)', 'AdaBoost', 'Artificial intelligence', 'Machine learning', 'Classifier (UML)', 'Bayesian probability', 'Pattern recognition (psychology)', 'Artificial neural network']",,,,1,15,Dietterich 2000 Lecture VV0,Oregon State University,Oregon State University,Oregon State University
+OPENALEX,https://openalex.org/W2559394418,10.1038/nature23474,28905917,Quantum machine learning,Nature,,,2017,article,en,4433,"['Biamonte J.', 'Wittek P.', 'Pancotti N.', 'Rebentrost P.', 'Wiebe N.', 'Lloyd S.']","['Jacob Biamonte', 'Péter Wittek', 'Nicola Pancotti', 'Patrick Rebentrost', 'Nathan Wiebe', 'Seth Lloyd']","['Skolkovo Institute of Science and Technology', 'Institute of Photonic Sciences', 'Max Planck Institute of Quantum Optics', 'Massachusetts Institute of Technology', 'Microsoft (United States)', 'Massachusetts Institute of Technology']",,"['W51943945', 'W118877790', 'W199424061', 'W882068046', 'W999198455', 'W1479793620', 'W1492999010', 'W1503870031', 'W1529944915', 'W1534582174', 'W1559984405', 'W1568345435', 'W1631356911', 'W1684389741', 'W1703581136', 'W1743210689', 'W1872619987', 'W1965702053', 'W1968390152', 'W1968561119', 'W1979692035', 'W1980314119', 'W1981783889', 'W1983561139', 'W1988369744', 'W1994630055', 'W2001157051', 'W2010505240', 'W2015811642', 'W2019658260', 'W2021276590', 'W2022786335', 'W2028918948', 'W2030545386', 'W2035551859', 'W2040792108', 'W2040870580', 'W2041506125', 'W2042127289', 'W2046481556', 'W2051446825', 'W2055784634', 'W2064517571', 'W2069563009', 'W2075236172', 'W2086236885', 'W2097981279', 'W2101403221', 'W2103956991', 'W2104944940', 'W2106090814', 'W2110322033', 'W2120480077', 'W2120802379', 'W2124269824', 'W2153346333', 'W2153887174', 'W2155728415', 'W2156909104', 'W2170504083', 'W2188879252', 'W2195198640', 'W2207520826', 'W2207698480', 'W2221147613', 'W2262683142', 'W2266138411', 'W2272691542', 'W2306477081', 'W2327049932', 'W2334150129', 'W2337082154', 'W2341702711', 'W2397157153', 'W2409645286', 'W2419175238', 'W2468412683', 'W2478948476', 'W2489886790', 'W2490964415', 'W2495424399', 'W2516533688', 'W2517233404', 'W2521267242', 'W2528744766', 'W2557392572', 'W2560386163', 'W2571629069', 'W2579928628', 'W2580674237', 'W2582909346', 'W2595654587', 'W2604642811', 'W2607911764', 'W2612799626', 'W2751668559', 'W2764347725', 'W2766518897', 'W2768556639', 'W2919115771', 'W2949537205', 'W2951663210', 'W2952050628', 'W2962688653', 'W2962821153', 'W2962954040', 'W2963060324', 'W2963331258', 'W2963614945', 'W2963762919', 'W2964039664', 'W3022610800', 'W3023478445', 'W3098126014', 'W3098768946', 'W3098965398', 'W3099695580', 'W3100863707', 'W3101664568', 'W3102047485', 'W3103372543', 'W3104450852', 'W3104599990', 'W3105377867', 'W3106418633', 'W3111297213', 'W4230674625', 'W4297801632', 'W4301805094', 'W6687462962']","['Quantum machine learning', 'Computer science', 'Quantum', 'Software', 'Field (mathematics)', 'Quantum computer', 'Artificial intelligence', 'Computer engineering', 'Programming language', 'Physics', 'Mathematics']","['Quantum machine learning', 'Computer science', 'Quantum', 'Software', 'Field (mathematics)', 'Quantum computer', 'Artificial intelligence', 'Computer engineering', 'Programming language', 'Physics', 'Mathematics', 'Pure mathematics', 'Quantum mechanics']",,549,7671,195,202,Biamonte 2017 Nature V549,Skolkovo Institute of Science and Technology;Institute of Photonic Sciences;Max Planck Institute of Quantum Optics;Massachusetts Institute of Technology;Microsoft (United States);Massachusetts Institute of Technology,Skolkovo Institute of Science and Technology,Skolkovo Institute of Science and Technology;Institute of Photonic Sciences;Max Planck Institute of Quantum Optics;Massachusetts Institute of Technology;Microsoft (United States);Massachusetts Institute of Technology
+OPENALEX,https://openalex.org/W2912213068,10.1145/3298981,,Federated Machine Learning,ACM Transactions on Intelligent Systems and Technology,,,2019,article,en,5855,"['Yang Q.', 'Liu Y.', 'Chen T.', 'Tong Y.']","['Qiang Yang', 'Yang Liu', 'Tianjian Chen', 'Yongxin Tong']","['Hong Kong University of Science and Technology', 'Beihang University']",,"['W150223756', 'W162878246', 'W199752024', 'W1484769234', 'W1485800369', 'W1488526968', 'W1510952750', 'W1559506103', 'W1574534563', 'W1964366273', 'W1968265138', 'W1971991172', 'W1985511977', 'W2016758618', 'W2024652123', 'W2027471022', 'W2041416246', 'W2053637704', 'W2082624086', 'W2092422002', 'W2093367651', 'W2109426455', 'W2112022568', 'W2112340198', 'W2128906841', 'W2132737349', 'W2137351756', 'W2139336600', 'W2159024459', 'W2165698076', 'W2257979135', 'W2283463896', 'W2295292576', 'W2317339301', 'W2435473771', 'W2473418344', 'W2530417694', 'W2536058570', 'W2577421826', 'W2585580772', 'W2591882872', 'W2606882085', 'W2618494520', 'W2679684481', 'W2701059868', 'W2757853533', 'W2765200655', 'W2766255512', 'W2767079719', 'W2768347741', 'W2773194476', 'W2774000609', 'W2777914285', 'W2781091734', 'W2788629937', 'W2793216106', 'W2793925626', 'W2794888826', 'W2798551148', 'W2799803467', 'W2801958627', 'W2807006176', 'W2810065831', 'W2886722183', 'W2895865029', 'W2914304175', 'W2949140995', 'W2950460048', 'W2951152347', 'W2951368041', 'W2951798842', 'W2962877476', 'W2963106566', 'W2990138404', 'W3029558105', 'W3209546151', 'W4248358572', 'W4249529812', 'W4300427714', 'W4301418013', 'W4301483968', 'W6606067566', 'W6732586565', 'W6738383168', 'W6807767519']","['Computer science', 'Federated learning', 'Transfer of learning', 'Artificial intelligence', 'Data science', 'Computer security']","['Computer science', 'Federated learning', 'Transfer of learning', 'Artificial intelligence', 'Data science', 'Computer security']",,10,2,1,19,Yang 2019 ACM V10,Hong Kong University of Science and Technology;Beihang University,Hong Kong University of Science and Technology,Hong Kong University of Science and Technology;Beihang University
+OPENALEX,https://openalex.org/W2402144811,10.5555/3026877.3026899,,TensorFlow: a system for large-scale machine learning,Operating Systems Design and Implementation,,,2016,article,en,6353,"['Abadi M.', 'Barham P.', 'Chen J.', 'Chen Z.', 'Davis A.', 'Dean J.', 'Devin M.', 'Ghemawat S.', 'Irving G.', 'Isard M.', 'Kudlur M.', 'Levenberg J.', 'Monga R.', 'Moore S.', 'Murray D.', 'Steiner B.', 'Tucker P.', 'Vasudevan V.', 'Warden P.', 'Wicke M.', 'Yu Y.', 'Zheng X.']","['Martı́n Abadi', 'Paul Barham', 'Jianmin Chen', 'Zhifeng Chen', 'Andy Davis', 'Jay B. Dean', 'Matthieu Devin', 'Sanjay Ghemawat', 'Geoffrey Irving', 'Michael Isard', 'Manjunath Kudlur', 'Josh Levenberg', 'Rajat Monga', 'Sherry Moore', 'Derek G. Murray', 'Benoit Steiner', 'Paul A. Tucker', 'Vijay Vasudevan', 'Pete Warden', 'Martin Wicke', 'Yuan Yu', 'Xiaoqiang Zheng']","['Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)']",,"['W104184427', 'W145476170', 'W1425731158', 'W1442374986', 'W1485981043', 'W1493893823', 'W1498436455', 'W1526734559', 'W1539309091', 'W1548328233', 'W1598866093', 'W1658008008', 'W1667652561', 'W1815076433', 'W1947291763', 'W1978660892', 'W2016053056', 'W2032036568', 'W2035424729', 'W2041517243', 'W2061570747', 'W2064675550', 'W2066443755', 'W2083842231', 'W2097117768', 'W2100664567', 'W2100830825', 'W2117539524', 'W2122465391', 'W2131975293', 'W2132339004', 'W2140833774', 'W2141992894', 'W2145339207', 'W2146502635', 'W2146757372', 'W2147527908', 'W2160815625', 'W2168231600', 'W2172654076', 'W2186615578', 'W2194775991', 'W2253807446', 'W2259472270', 'W2336650964', 'W2339765813', 'W2384495648', 'W2521218765', 'W2525778437', 'W2618530766', 'W2949117887', 'W2949888546', 'W2950577311', 'W2951781666', 'W2962844195']","['Dataflow', 'Computer science', 'Artificial intelligence', 'Multi-core processor', 'Machine learning', 'Computer architecture', 'Deep learning', 'Scalability', 'Inference', 'Artificial neural network', 'Dataflow architecture', 'Computation', 'Distributed computing', 'Parallel computing', 'Programming language', 'Operating system']","['Dataflow', 'Computer science', 'Artificial intelligence', 'Multi-core processor', 'Machine learning', 'Computer architecture', 'Deep learning', 'Scalability', 'Inference', 'Artificial neural network', 'Dataflow architecture', 'Computation', 'Distributed computing', 'Parallel computing', 'Programming language', 'Operating system']",,,,265,283,Abadi 2016 Operating VV0,Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States),Google (United States),Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States)
+OPENALEX,https://openalex.org/W2155653793,10.1016/s0031-3203(96)00142-2,,The use of the area under the ROC curve in the evaluation of machine learning algorithms,Pattern Recognition,,,1997,article,en,7222,['Bradley A.'],['Andrew P. Bradley'],['University of Queensland'],,"['W102612133', 'W1479940792', 'W1488460165', 'W1489095897', 'W1515026043', 'W1533986854', 'W1541145887', 'W1587362683', 'W1588861010', 'W1594031697', 'W1623080549', 'W1704669313', 'W1770825568', 'W1784695092', 'W1967760155', 'W1969341260', 'W1969557815', 'W1983523174', 'W1989164753', 'W1995023359', 'W2002096058', 'W2026980413', 'W2049172236', 'W2050206309', 'W2060136512', 'W2102150307', 'W2110323455', 'W2116939452', 'W2117897510', 'W2125055259', 'W2135346934', 'W2145224695', 'W2157825442', 'W2322002063', 'W2766736793', 'W2921629193', 'W2988864014', 'W3015981925', 'W3085162807', 'W3137161744', 'W4233107852', 'W4254952533', 'W4300993416', 'W4400445037', 'W6629338572', 'W6632481002', 'W6635398855', 'W6642591540', 'W6650814897', 'W6676534550', 'W6682610290', 'W7020983598']","['Algorithm', 'Receiver operating characteristic', 'Machine learning', 'Artificial intelligence', 'Perceptron', 'Computer science', 'Discriminant', 'Multilayer perceptron', 'Mathematics', 'Artificial neural network']","['Algorithm', 'Receiver operating characteristic', 'Machine learning', 'Artificial intelligence', 'Perceptron', 'Computer science', 'Discriminant', 'Multilayer perceptron', 'Mathematics', 'Artificial neural network']",,30,7,1145,1159,Bradley 1997 Pattern V30,University of Queensland,University of Queensland,University of Queensland
+OPENALEX,https://openalex.org/W1506806321,,,Pattern Recognition and Machine Learning (Information Science and Statistics),Springer eBooks,,,2006,book,en,8357,['Bishop C.'],['Chris Bishop'],[],,[],"['Artificial intelligence', 'Computer science', 'Statistics', 'Pattern recognition (psychology)', 'Machine learning', 'Mathematics']","['Artificial intelligence', 'Computer science', 'Statistics', 'Pattern recognition (psychology)', 'Machine learning', 'Mathematics']",,,,,,Bishop 2006 Springer VV0,,,
+OPENALEX,https://openalex.org/W2009086942,10.1198/tech.2007.s518,,Pattern Recognition and Machine Learning,Technometrics,,,2007,article,en,4652,['Neal R.'],['Radford M. Neal'],['University of Toronto'],,[],"['Artificial intelligence', 'Computer science', 'Machine learning', 'Pattern recognition (psychology)']","['Artificial intelligence', 'Computer science', 'Machine learning', 'Pattern recognition (psychology)']",,49,3,366,366,Neal 2007 Technometrics V49,University of Toronto,University of Toronto,University of Toronto
+OPENALEX,https://openalex.org/W2131241448,10.48550/arxiv.1206.2944,,Practical Bayesian Optimization of Machine Learning Algorithms,arXiv (Cornell University),,,2012,preprint,en,5669,"['Snoek J.', 'Larochelle H.', 'Adams R.']","['Jasper Snoek', 'Hugo Larochelle', 'Ryan P. Adams']","['University of Toronto', 'Université de Sherbrooke', 'Harvard University']",,"['W60686164', 'W78356000', 'W84569508', 'W1497675750', 'W1746819321', 'W1973333099', 'W2061144551', 'W2097998348', 'W2099201756', 'W2106411961', 'W2106869737', 'W2119595900', 'W2129458072', 'W2132984949', 'W2141125852', 'W2147196093', 'W2151238122', 'W2165599843', 'W2189424119', 'W2197776371', 'W2951665052', 'W2964172739', 'W3118608800']","['Bayesian optimization', 'Computer science', 'Bayesian probability', 'Machine learning', 'Artificial intelligence', 'Optimization algorithm', 'Algorithm', 'Mathematical optimization', 'Mathematics']","['Bayesian optimization', 'Computer science', 'Bayesian probability', 'Machine learning', 'Artificial intelligence', 'Optimization algorithm', 'Algorithm', 'Mathematical optimization', 'Mathematics']",,,,,,Snoek 2012 arXiv VV0,University of Toronto;Université de Sherbrooke;Harvard University,University of Toronto,University of Toronto;Université de Sherbrooke;Harvard University
+OPENALEX,https://openalex.org/W2884430236,10.1038/s41586-018-0337-2,30046072,Machine learning for molecular and materials science,Nature,,,2018,review,en,4508,"['Butler K.', 'Davies D.', 'Cartwright H.', 'Isayev O.', 'Walsh A.']","['Keith T. Butler', 'Daniel W. Davies', 'Hugh Cartwright', 'Olexandr Isayev', 'Aron Walsh']","['Research Complex at Harwell', 'Rutherford Appleton Laboratory', 'University of Bath', 'University of Oxford', 'University of North Carolina at Chapel Hill', 'Yonsei University']",,"['W617139115', 'W639205477', 'W1491105865', 'W1492999010', 'W1510073064', 'W1565640256', 'W1625305535', 'W1710476689', 'W1757990252', 'W1865667476', 'W1968761064', 'W1976492731', 'W1979769287', 'W1982589276', 'W1982598895', 'W1992985800', 'W1997974358', 'W2007400012', 'W2020786104', 'W2025679679', 'W2030843415', 'W2030976617', 'W2032026767', 'W2034097448', 'W2036524141', 'W2052226480', 'W2052891002', 'W2057069496', 'W2058452634', 'W2063007245', 'W2067250248', 'W2074616700', 'W2076063813', 'W2081413236', 'W2083415705', 'W2104489082', 'W2123306226', 'W2124234891', 'W2127168465', 'W2128245586', 'W2134164499', 'W2138178257', 'W2157886206', 'W2164524421', 'W2173027866', 'W2194321275', 'W2217912240', 'W2230728100', 'W2279490987', 'W2310703973', 'W2324964582', 'W2325264655', 'W2328928309', 'W2337082154', 'W2338402873', 'W2346180883', 'W2346400664', 'W2347129741', 'W2349487082', 'W2418973097', 'W2468638527', 'W2477622860', 'W2478294658', 'W2503662290', 'W2509907061', 'W2520022941', 'W2520500207', 'W2521267242', 'W2525748878', 'W2531602199', 'W2537064446', 'W2540627216', 'W2541404351', 'W2559394418', 'W2565684601', 'W2571050567', 'W2580919858', 'W2591366729', 'W2599053724', 'W2606044016', 'W2611413954', 'W2618625858', 'W2619580215', 'W2620846205', 'W2621738901', 'W2621742623', 'W2734520197', 'W2740407088', 'W2746244909', 'W2747592475', 'W2752180799', 'W2753962198', 'W2766362701', 'W2789615344', 'W2951016506', 'W2963094133', 'W2964113829', 'W2964116922', 'W2964217201', 'W3037315640', 'W3099950071', 'W4240502307', 'W4252359241', 'W6637568146', 'W6730103093', 'W6735944222', 'W6910696677']","['Computer science', 'Field (mathematics)', 'Data science', 'Characterization (materials science)', 'Domain (mathematical analysis)', 'Artificial intelligence', 'Cognitive science', 'Nanotechnology', 'Machine learning', 'Psychology', 'Materials science']","['Computer science', 'Field (mathematics)', 'Data science', 'Characterization (materials science)', 'Domain (mathematical analysis)', 'Artificial intelligence', 'Cognitive science', 'Nanotechnology', 'Machine learning', 'Psychology', 'Materials science', 'Mathematics', 'Mathematical analysis', 'Pure mathematics']",,559,7715,547,555,Butler 2018 Nature V559,Research Complex at Harwell;Rutherford Appleton Laboratory;University of Bath;University of Oxford;University of North Carolina at Chapel Hill;Yonsei University,Research Complex at Harwell,Research Complex at Harwell;Rutherford Appleton Laboratory;University of Bath;University of Oxford;University of North Carolina at Chapel Hill;Yonsei University
+OPENALEX,https://openalex.org/W2934399013,10.1056/nejmra1814259,30943338,Machine Learning in Medicine,New England Journal of Medicine,,,2019,review,en,3946,"['Rajkomar A.', 'Dean J.', 'Kohane I.']","['Alvin Rajkomar', 'Jay B. Dean', 'Isaac S. Kohane']","['Google (United States)', 'Google (United States)', 'Google (United States)', 'Harvard University']",,"['W1524493166', 'W1529983430', 'W2005440935', 'W2009184733', 'W2009954208', 'W2027540165', 'W2033163059', 'W2033609349', 'W2043092953', 'W2054076956', 'W2083721602', 'W2096849439', 'W2103018059', 'W2103889389', 'W2119472226', 'W2137767404', 'W2147246123', 'W2166187912', 'W2167414941', 'W2174931596', 'W2267932926', 'W2276530525', 'W2337116044', 'W2415841860', 'W2468431774', 'W2512902140', 'W2515682654', 'W2528491735', 'W2530247697', 'W2548723212', 'W2557738935', 'W2581082771', 'W2598272139', 'W2732701910', 'W2734356183', 'W2738975713', 'W2740060821', 'W2752747624', 'W2753059860', 'W2754518417', 'W2758348074', 'W2762741128', 'W2772246530', 'W2772723798', 'W2782945064', 'W2784499877', 'W2785268987', 'W2785526886', 'W2788633781', 'W2789894922', 'W2790444357', 'W2791819448', 'W2792902933', 'W2793267369', 'W2794457162', 'W2799837895', 'W2804685074', 'W2809453031', 'W2886281300', 'W2887623535', 'W2887719255', 'W2888109941', 'W2889242407', 'W2889494558', 'W2894917609', 'W2896385413', 'W2896817483', 'W2897434820', 'W2899560923', 'W2902802452', 'W2908201961', 'W2914579361', 'W2916105049', 'W2919115771', 'W3098949126', 'W4205374244', 'W4212774754', 'W4296220420']","['Download', 'Computer science', 'Data science', 'Medicine', 'Medical education', 'Artificial intelligence', 'World Wide Web']","['Download', 'Computer science', 'Data science', 'Medicine', 'Medical education', 'Artificial intelligence', 'World Wide Web']",,380,14,1347,1358,Rajkomar 2019 New V380,Google (United States);Google (United States);Google (United States);Harvard University,Google (United States),Google (United States);Google (United States);Google (United States);Harvard University
+OPENALEX,https://openalex.org/W2913668833,,,Proceedings of the 25th international conference on Machine learning,,,,2008,article,en,5549,"['Cohen W.', 'McCallum A.', 'Roweis S.']","['William W. Cohen', 'Andrew McCallum', 'Sam T. Roweis']","['Carnegie Mellon University', 'University of Massachusetts Amherst', 'Google (United States)', 'University of Toronto']",,[],"['Presentation (obstetrics)', 'Library science', 'Computer science', 'Medical education', 'Artificial intelligence', 'Medicine']","['Presentation (obstetrics)', 'Library science', 'Computer science', 'Medical education', 'Artificial intelligence', 'Medicine', 'Radiology']",,,,,,Cohen 2008 UNKNOWNJ VV0,Carnegie Mellon University;University of Massachusetts Amherst;Google (United States);University of Toronto,Carnegie Mellon University,Carnegie Mellon University;University of Massachusetts Amherst;Google (United States);University of Toronto
+OPENALEX,https://openalex.org/W2149684865,10.1007/bfb0026683,,Text categorization with Support Vector Machines: Learning with many relevant features,Lecture notes in computer science,,,1998,book-chapter,en,7984,['Joachims T.'],['Thorsten Joachims'],['TU Dortmund University'],,"['W740415', 'W1504694836', 'W1978394996', 'W2023677852', 'W2087614174', 'W2096152098', 'W2114535528', 'W2119821739', 'W2125055259', 'W2149684865', 'W2156909104', 'W2164547069', 'W2435251607', 'W6821113053']","['Support vector machine', 'Computer science', 'Machine learning', 'Artificial intelligence', 'Categorization', 'Text categorization', 'Task (project management)', 'Variety (cybernetics)', 'Empirical research', 'Relevance vector machine', 'Mathematics']","['Support vector machine', 'Computer science', 'Machine learning', 'Artificial intelligence', 'Categorization', 'Text categorization', 'Task (project management)', 'Variety (cybernetics)', 'Empirical research', 'Relevance vector machine', 'Mathematics', 'Statistics', 'Management', 'Economics']",,,,137,142,Joachims 1998 Lecture VV0,TU Dortmund University,TU Dortmund University,TU Dortmund University
+OPENALEX,https://openalex.org/W1485009520,10.48550/arxiv.1506.04214,,Convolutional LSTM Network: A Machine Learning Approach for Precipitation Nowcasting,arXiv (Cornell University),,,2015,preprint,en,6647,"['Shi X.', 'Chen Z.', 'Wang H.', 'Yeung D.', 'Wong W.', 'Woo W.']","['Xingjian Shi', 'Zhourong Chen', 'Hao Wang', 'Dit‐Yan Yeung', 'Wai Kin Wong', 'Wang‐chun Woo']","['Hong Kong University of Science and Technology', 'Hong Kong University of Science and Technology', 'Hong Kong University of Science and Technology', 'Hong Kong University of Science and Technology', 'Hong Kong Observatory', 'Hong Kong Observatory']",,"['W588441650', 'W962117656', 'W1514535095', 'W1568514080', 'W1606347560', 'W1810943226', 'W1815076433', 'W1867429401', 'W1903029394', 'W1905882502', 'W1947481528', 'W1982479097', 'W2024414272', 'W2030459037', 'W2064675550', 'W2079565659', 'W2116435618', 'W2130942839', 'W2157331557', 'W2557283755', 'W2787727108', 'W2950635152', 'W2951183276', 'W2952453038', 'W4233546237', 'W4294306266', 'W4308909683']","['Nowcasting', 'Computer science', 'Convolutional neural network', 'Artificial intelligence', 'Precipitation', 'State (computer science)', 'Machine learning', 'Perspective (graphical)', 'Pattern recognition (psychology)', 'Algorithm', 'Meteorology', 'Geography']","['Nowcasting', 'Computer science', 'Convolutional neural network', 'Artificial intelligence', 'Precipitation', 'State (computer science)', 'Machine learning', 'Perspective (graphical)', 'Pattern recognition (psychology)', 'Algorithm', 'Meteorology', 'Geography']",,,,,,Shi 2015 arXiv VV0,Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong Observatory;Hong Kong Observatory,Hong Kong University of Science and Technology,Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong Observatory;Hong Kong Observatory
+OPENALEX,https://openalex.org/W1502922572,10.1007/978-3-540-28650-9_4,,Gaussian Processes in Machine Learning,Lecture notes in computer science,,,2004,book-chapter,en,5117,['Rasmussen C.'],['Carl Edward Rasmussen'],['Max Planck Institute for Biological Cybernetics'],,"['W1657213141', 'W1746680969', 'W2117063635', 'W2129564505']","['Computer science', 'Hyperparameter', 'Gaussian process', 'Focus (optics)', 'Machine learning', 'Artificial intelligence', 'Process (computing)', 'Gaussian', 'Marginal likelihood', 'Simple (philosophy)', 'Kriging', 'Marginal distribution', 'Algorithm', 'Mathematical optimization', 'Random variable', 'Statistics', 'Mathematics']","['Computer science', 'Hyperparameter', 'Gaussian process', 'Focus (optics)', 'Machine learning', 'Artificial intelligence', 'Process (computing)', 'Gaussian', 'Marginal likelihood', 'Simple (philosophy)', 'Kriging', 'Marginal distribution', 'Algorithm', 'Mathematical optimization', 'Random variable', 'Statistics', 'Mathematics', 'Philosophy', 'Operating system', 'Optics', 'Bayesian probability', 'Epistemology', 'Physics', 'Quantum mechanics']",,,,63,71,Rasmussen 2004 Lecture VV0,Max Planck Institute for Biological Cybernetics,Max Planck Institute for Biological Cybernetics,Max Planck Institute for Biological Cybernetics
+OPENALEX,https://openalex.org/W114517082,10.1007/978-3-7908-2604-3_16,,Large-Scale Machine Learning with Stochastic Gradient Descent,,,,2010,book-chapter,en,5624,['Bottou L.'],['Léon Bottou'],['Princeton University'],,"['W1505356468', 'W1535810436', 'W1629097610', 'W2029538739', 'W2030811966', 'W2035720976', 'W2043919728', 'W2068484625', 'W2086161653', 'W2098921539', 'W2101159990', 'W2113651538', 'W2119821739', 'W2127218421', 'W2129191766', 'W2135046866', 'W2137515395', 'W2147880316', 'W2150102617', 'W2154451187', 'W2322150470', 'W2416173357', 'W2766736793', 'W2990138404', 'W3207342693', 'W4238284510']","['Stochastic gradient descent', 'Computer science', 'Scale (ratio)', 'Stochastic optimization', 'Gradient descent', 'Set (abstract data type)', 'Online machine learning', 'Context (archaeology)', 'Sample (material)', 'Artificial intelligence', 'Algorithm', 'Mathematical optimization', 'Machine learning', 'Mathematics', 'Active learning (machine learning)', 'Artificial neural network']","['Stochastic gradient descent', 'Computer science', 'Scale (ratio)', 'Stochastic optimization', 'Gradient descent', 'Set (abstract data type)', 'Online machine learning', 'Context (archaeology)', 'Sample (material)', 'Artificial intelligence', 'Algorithm', 'Mathematical optimization', 'Machine learning', 'Mathematics', 'Active learning (machine learning)', 'Artificial neural network', 'Programming language', 'Chromatography', 'Paleontology', 'Physics', 'Chemistry', 'Biology', 'Quantum mechanics']",,,,177,186,Bottou 2010 UNKNOWNJ VV0,Princeton University,Princeton University,Princeton University
+OPENALEX,https://openalex.org/W1680797894,10.1007/978-0-387-30164-8,,Encyclopedia of Machine Learning,,,,2010,book,en,3462,['Sammut C.'],['Claude Sammut'],['UNSW Sydney'],,[],"['Encyclopedia', 'Computer science', 'Artificial intelligence', 'Data science', 'Library science']","['Encyclopedia', 'Computer science', 'Artificial intelligence', 'Data science', 'Library science']",,,,,,Sammut 2010 UNKNOWNJ VV0,UNSW Sydney,UNSW Sydney,UNSW Sydney
+OPENALEX,https://openalex.org/W2945976633,10.1038/s42256-019-0048-x,35603010,Stop explaining black box machine learning models for high stakes decisions and use interpretable models instead,Nature Machine Intelligence,,,2019,article,en,8911,['Rudin C.'],['Cynthia Rudin'],['Duke University'],,"['W1492170170', 'W1537462412', 'W1731081199', 'W1746506709', 'W1905782493', 'W1973682096', 'W1984314602', 'W1994407253', 'W2013587512', 'W2026905436', 'W2046945713', 'W2072136246', 'W2082262280', 'W2132166479', 'W2134598164', 'W2141097525', 'W2149033360', 'W2163598528', 'W2239135493', 'W2248060815', 'W2467510144', 'W2493343568', 'W2579555219', 'W2604231045', 'W2613140028', 'W2621305858', 'W2743731382', 'W2752988282', 'W2765813195', 'W2767442356', 'W2778670458', 'W2798857668', 'W2811104224', 'W2811374795', 'W2894881080', 'W2895051075', 'W2896176822', 'W2898694742', 'W2899360465', 'W2901939789', 'W2902991393', 'W2910705748', 'W2962689739', 'W2963125461', 'W2963533879', 'W2963816926', 'W2964134873', 'W2964180856', 'W3085162807', 'W3098636317', 'W3102221121', 'W3102834905', 'W3122175177', 'W4234008654', 'W6743543778']","['Black box', 'Harm', 'Computer science', 'Key (lock)', 'Criminal justice', 'Artificial intelligence', 'Economic Justice', 'Machine learning', 'Data science', 'Criminology', 'Psychology', 'Computer security', 'Political science', 'Social psychology', 'Law']","['Black box', 'Harm', 'Computer science', 'Key (lock)', 'Criminal justice', 'Artificial intelligence', 'Economic Justice', 'Machine learning', 'Data science', 'Criminology', 'Psychology', 'Computer security', 'Political science', 'Social psychology', 'Law']",,1,5,206,215,Rudin 2019 Nature V1,Duke University,Duke University,Duke University
+OPENALEX,https://openalex.org/W2177870565,10.1161/circulationaha.115.001593,26572668,Machine Learning in Medicine,Circulation,,,2015,review,en,3408,['Deo R.'],['Rahul C. Deo'],['QB3'],,"['W40442397', 'W1480376833', 'W1678356000', 'W1808991731', 'W1902027874', 'W1976196376', 'W2011999110', 'W2021701428', 'W2029243817', 'W2052825782', 'W2072128103', 'W2073751243', 'W2105464873', 'W2106665921', 'W2110243528', 'W2112289645', 'W2112592817', 'W2113606819', 'W2116802246', 'W2119361626', 'W2120480077', 'W2121495423', 'W2122111042', 'W2127482775', 'W2135046866', 'W2139212933', 'W2147461734', 'W2149298154', 'W2152072062', 'W2158927033', 'W2162586165', 'W2163697531', 'W2164434252', 'W2345255551', 'W2787894218', 'W2911964244', 'W2912934387', 'W2963481018', 'W2998216295', 'W3099478002', 'W4212883601', 'W4231109964', 'W4243607236', 'W4285719527', 'W6601599523', 'W6676903177', 'W7066667914']","['Medicine', 'Medical physics', 'Medical education', 'Intensive care medicine']","['Medicine', 'Medical physics', 'Medical education', 'Intensive care medicine']",,132,20,1920,1930,Deo 2015 Circulation V132,QB3,QB3,QB3
+OPENALEX,https://openalex.org/W2619383789,10.1109/tpami.2018.2798607,29994351,Multimodal Machine Learning: A Survey and Taxonomy,IEEE Transactions on Pattern Analysis and Machine Intelligence,,,2018,article,en,4206,"['Baltrušaitis T.', 'Ahuja C.', 'Morency L.']","['Tadas Baltrušaitis', 'Chaitanya Ahuja', 'Louis‐Philippe Morency']","['Microsoft Research (United Kingdom)', 'Carnegie Mellon University', 'Carnegie Mellon University']",,"['W8316075', 'W21006490', 'W22229905', 'W59175527', 'W68733909', 'W129606432', 'W155596317', 'W189596042', 'W199018803', 'W262578090', 'W854541894', 'W877909479', 'W956551720', 'W1123427201', 'W1480583224', 'W1481820510', 'W1488163396', 'W1503933356', 'W1514535095', 'W1522301498', 'W1523385540', 'W1527575280', 'W1528056001', 'W1533861849', 'W1540429825', 'W1555767263', 'W1566289585', 'W1572567476', 'W1573040851', 'W1586939924', 'W1601567445', 'W1628307106', 'W1651753422', 'W1664311846', 'W1686810756', 'W1687846465', 'W1753482797', 'W1762503104', 'W1766290689', 'W1773149199', 'W1811254738', 'W1822526425', 'W1828348983', 'W1836465849', 'W1858383477', 'W1870428314', 'W1872883209', 'W1883346539', 'W1889038981', 'W1889081078', 'W1893116441', 'W1895577753', 'W1897761818', 'W1905882502', 'W1906515132', 'W1922557984', 'W1931795219', 'W1933065844', 'W1933349210', 'W1956340063', 'W1963540633', 'W1964073652', 'W1966811077', 'W1969616664', 'W1970055505', 'W1971791733', 'W1976066595', 'W1977547683', 'W1985867508', 'W1986451414', 'W1987835821', 'W1996418862', 'W1996478295', 'W2000911139', 'W2003333103', 'W2006969979', 'W2009059481', 'W2012237712', 'W2015394094', 'W2015412875', 'W2019024625', 'W2022799064', 'W2025341678', 'W2025638820', 'W2026012689', 'W2026243162', 'W2038698865', 'W2041288440', 'W2042608483', 'W2048343491', 'W2048679005', 'W2051721233', 'W2053101950', 'W2057568625', 'W2058616948', 'W2061781940', 'W2062632672', 'W2062955551', 'W2063036810', 'W2063330527', 'W2064675550', 'W2066667210', 'W2068676460', 'W2069682406', 'W2077395415', 'W2080576537', 'W2083885588', 'W2090048052', 'W2095705004', 'W2096391593', 'W2098411764', 'W2098562545', 'W2099471712', 'W2100235303', 'W2100561338', 'W2101105183', 'W2101534792', 'W2102765684', 'W2105103432', 'W2106277773', 'W2108710284', 'W2109586012', 'W2109743529', 'W2111078031', 'W2111645492', 'W2112019442', 'W2112184938', 'W2112912048', 'W2113507809', 'W2118714046', 'W2119288237', 'W2120776756', 'W2123024445', 'W2124033848', 'W2124372976', 'W2125336414', 'W2125366733', 'W2126598020', 'W2128856065', 'W2129142580', 'W2129360799', 'W2129382193', 'W2130055251', 'W2130162821', 'W2130942839', 'W2131179926', 'W2133459682', 'W2133564696', 'W2135776491', 'W2136922672', 'W2136985729', 'W2137735870', 'W2137806537', 'W2141477623', 'W2142192571', 'W2142900973', 'W2143449221', 'W2143492886', 'W2143612262', 'W2143926884', 'W2145056192', 'W2147880316', 'W2147885303', 'W2148298736', 'W2149172860', 'W2149557440', 'W2149940198', 'W2150295085', 'W2150658333', 'W2150696241', 'W2150824314', 'W2151096985', 'W2151103935', 'W2152239535', 'W2153579005', 'W2153927146', 'W2156303437', 'W2156503193', 'W2159973364', 'W2160815625', 'W2163108352', 'W2163605009', 'W2163922914', 'W2164186291', 'W2164450870', 'W2164587673', 'W2164699598', 'W2167103782', 'W2173180041', 'W2180844455', 'W2181691731', 'W2184045248', 'W2184188583', 'W2185175083', 'W2201007611', 'W2203543769', 'W2220981600', 'W2250742840', 'W2250842428', 'W2251353663', 'W2251394420', 'W2251885125', 'W2251970440', 'W2252122141', 'W2252238675', 'W2266728343', 'W2267126114', 'W2282219577', 'W2291822808', 'W2293453011', 'W2294797155', 'W2296613712', 'W2316138215', 'W2327501763', 'W2342662179', 'W2388114291', 'W2397159106', 'W2399507222', 'W2399733683', 'W2402955625', 'W2405756170', 'W2411037331', 'W2418349398', 'W2434537049', 'W2462496837', 'W2470413457', 'W2489434015', 'W2494980014', 'W2519091744', 'W2519656895', 'W2520160253', 'W2546919788', 'W2557865186', 'W2579317665', 'W2914699769', 'W2949465329', 'W2953318193', 'W2962706528', 'W2962756039', 'W2962835968', 'W2963082528', 'W2963109634', 'W2963143316', 'W2963192057', 'W2963260436', 'W2963324994', 'W2963383024', 'W2963389687', 'W2963410018', 'W2963576560', 'W2963579811', 'W2963605190', 'W2963656855', 'W2963735856', 'W2963811219', 'W2963899908', 'W2963954913', 'W2964040984', 'W2964118342', 'W2964121744', 'W2964217371', 'W2964241990', 'W2964308564', 'W2964345931', 'W3000384245', 'W3023993913', 'W3087871082', 'W3125032682', 'W4211232216', 'W4212844288', 'W4240592325', 'W4244018879', 'W4245655784', 'W4252331534', 'W4285719527', 'W4293665662', 'W4294170691', 'W4297813007', 'W4299801216', 'W4302613066', 'W4320013936', 'W6600334730', 'W6600827882', 'W6605295763', 'W6606244218', 'W6606327593', 'W6607775107', 'W6608183366', 'W6623517193', 'W6623995992', 'W6625044600', 'W6628794645', 'W6629203210', 'W6630875275', 'W6631190155', 'W6631216910', 'W6631516269', 'W6631943919', 'W6634126550', 'W6636447180', 'W6636942303', 'W6637306801', 'W6637373629', 'W6637698695', 'W6637971603', 'W6637989529', 'W6638549007', 'W6638667902', 'W6638742206', 'W6639103823', 'W6639118148', 'W6639283537', 'W6639358663', 'W6639432524', 'W6639434097', 'W6640257717', 'W6640296258', 'W6640764460', 'W6650605322', 'W6652311901', 'W6674330103', 'W6675048546', 'W6676380891', 'W6676497082', 'W6676647902', 'W6676709516', 'W6678360021', 'W6678470764', 'W6678809451', 'W6679434410', 'W6679436768', 'W6680094886', 'W6680336390', 'W6681184217', 'W6682082992', 'W6682086108', 'W6682222085', 'W6682511423', 'W6682691769', 'W6682864246', 'W6683074461', 'W6683167905', 'W6683277684', 'W6684191040', 'W6684209796', 'W6685183736', 'W6685527872', 'W6686207219', 'W6687543112', 'W6687672932', 'W6688143368', 'W6691419566', 'W6691647468', 'W6692004142', 'W6696843773', 'W6697449767', 'W6712426025', 'W6712802073', 'W6713645886', 'W6717487601', 'W6726977916', 'W6727336983', 'W6729831399', 'W6730042849', 'W6730666313', 'W6732843983', 'W6845679800', 'W6898505805', 'W7011438494']","['Multimodal learning', 'Computer science', 'Artificial intelligence', 'Modalities', 'Taxonomy (biology)', 'Categorization', 'Multimodality', 'Field (mathematics)', 'Machine learning', 'Human–computer interaction', 'World Wide Web']","['Multimodal learning', 'Computer science', 'Artificial intelligence', 'Modalities', 'Taxonomy (biology)', 'Categorization', 'Multimodality', 'Field (mathematics)', 'Machine learning', 'Human–computer interaction', 'World Wide Web', 'Pure mathematics', 'Sociology', 'Social science', 'Botany', 'Mathematics', 'Biology']",,41,2,423,443,Baltrušaitis 2018 IEEE V41,Microsoft Research (United Kingdom);Carnegie Mellon University;Carnegie Mellon University,Microsoft Research (United Kingdom),Microsoft Research (United Kingdom);Carnegie Mellon University;Carnegie Mellon University
+OPENALEX,https://openalex.org/W3135028703,10.1007/s42979-021-00592-x,33778771,"Machine Learning: Algorithms, Real-World Applications and Research Directions",SN Computer Science,,,2021,review,en,5105,['Sarker I.'],['Iqbal H. Sarker'],"['Chittagong University of Engineering & Technology', 'Swinburne University of Technology']",,"['W4952878', 'W28669376', 'W44815768', 'W1128809682', 'W1484413656', 'W1484780623', 'W1491541693', 'W1498810706', 'W1508065755', 'W1515231270', 'W1543320899', 'W1566114229', 'W1570448133', 'W1594031697', 'W1629143244', 'W1673310716', 'W1806329564', 'W1912123407', 'W1917795079', 'W1927026191', 'W1948199107', 'W1965702297', 'W1967661515', 'W1974016210', 'W1977496278', 'W1981276685', 'W1982582425', 'W1989344766', 'W1990517717', 'W2015057666', 'W2018936209', 'W2026513874', 'W2058401212', 'W2064853889', 'W2069140227', 'W2071128523', 'W2083620785', 'W2088093492', 'W2090991262', 'W2097117768', 'W2099404336', 'W2099940443', 'W2101234009', 'W2106393550', 'W2107726111', 'W2109255472', 'W2112076978', 'W2112796928', 'W2119567691', 'W2120240539', 'W2120636621', 'W2127218421', 'W2132166479', 'W2134089414', 'W2140190241', 'W2142827986', 'W2143554828', 'W2144219012', 'W2147169507', 'W2149706766', 'W2151040995', 'W2154298720', 'W2160642098', 'W2163605009', 'W2164500538', 'W2166559705', 'W2194775991', 'W2215376118', 'W2257979135', 'W2294798173', 'W2296509296', 'W2341117600', 'W2394309960', 'W2395579298', 'W2504658994', 'W2510496529', 'W2518882834', 'W2531409750', 'W2557283755', 'W2580909119', 'W2581465409', 'W2603678388', 'W2609368436', 'W2617585083', 'W2617697157', 'W2622382573', 'W2713640100', 'W2724111113', 'W2752236180', 'W2762644836', 'W2771053518', 'W2802574842', 'W2803881474', 'W2806407311', 'W2889193967', 'W2904346290', 'W2906027675', 'W2909445826', 'W2910891387', 'W2911964244', 'W2912934387', 'W2913771179', 'W2940523548', 'W2950722229', 'W2954936648', 'W2955285339', 'W2960015156', 'W2962824709', 'W2963748489', 'W2971145443', 'W2982291760', 'W2990933508', 'W2991970757', 'W2998019206', 'W2998574808', 'W2999729612', 'W3002041203', 'W3003734944', 'W3007397514', 'W3011204221', 'W3014867431', 'W3016540417', 'W3017881119', 'W3019166713', 'W3023402713', 'W3034560014', 'W3037163353', 'W3038955483', 'W3039828206', 'W3041463877', 'W3044397306', 'W3044730720', 'W3049757379', 'W3083228182', 'W3084246142', 'W3085162807', 'W3086286002', 'W3095217282', 'W3099185017', 'W3100378204', 'W3102116369', 'W3121263745', 'W3122594683', 'W3129290453', 'W3130145150', 'W3139008799', 'W3149084432', 'W4212883601', 'W4230470477', 'W4236137412', 'W4244238212', 'W4245160364', 'W4298023569', 'W4298882835', 'W6601142415', 'W6674887505', 'W6675354045', 'W6675567579', 'W6676769703', 'W6843735874']","['Computer science', 'Artificial intelligence', 'Machine learning', 'Key (lock)', 'Big data', 'Data science', 'Data mining', 'Computer security']","['Computer science', 'Artificial intelligence', 'Machine learning', 'Key (lock)', 'Big data', 'Data science', 'Data mining', 'Computer security']",,2,3,160,160,Sarker 2021 SN V2,Chittagong University of Engineering & Technology;Swinburne University of Technology,Chittagong University of Engineering & Technology,Chittagong University of Engineering & Technology;Swinburne University of Technology
+OPENALEX,https://openalex.org/W2750384547,10.48550/arxiv.1708.07747,,Fashion-MNIST: a Novel Image Dataset for Benchmarking Machine Learning Algorithms,arXiv (Cornell University),,,2017,preprint,en,6087,"['Han X.', 'Rasul K.', 'Vollgraf R.']","['Xiao, Han', 'Kashif Rasul', 'Roland Vollgraf']",[],,"['W4919037', 'W2112796928', 'W2590796488']","['MNIST database', 'Benchmarking', 'Artificial intelligence', 'Grayscale', 'Computer science', 'Set (abstract data type)', 'Test set', 'Pattern recognition (psychology)', 'Image (mathematics)', 'Machine learning', 'Algorithm', 'Deep learning']","['MNIST database', 'Benchmarking', 'Artificial intelligence', 'Grayscale', 'Computer science', 'Set (abstract data type)', 'Test set', 'Pattern recognition (psychology)', 'Image (mathematics)', 'Machine learning', 'Algorithm', 'Deep learning', 'Programming language', 'Business', 'Marketing']",,,,,,Han 2017 arXiv VV0,,,
+OPENALEX,https://openalex.org/W2560674852,10.1145/1390156,,Proceedings of the 25th international conference on Machine learning - ICML '08,,,,2008,paratext,en,6716,[],[],[],,[],"['Computer science', 'Artificial intelligence']","['Computer science', 'Artificial intelligence']",,,,,,UNKNOWN 2008 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W1873332500,,,Supervised Machine Learning: A Review of Classification Techniques,,,,2007,review,en,4147,['Kotsiantis S.'],['Sotiris Kotsiantis'],['University of Peloponnese'],,"['W5472403', 'W135311109', 'W177590838', 'W203696055', 'W1007293483', 'W1497605902', 'W1506588750', 'W1515851193', 'W1520605446', 'W1522114398', 'W1528113134', 'W1537143578', 'W1538041071', 'W1547833367', 'W1554309553', 'W1560955742', 'W1562368284', 'W1563088657', 'W1567012231', 'W1570329253', 'W1570448133', 'W1570706771', 'W1587647246', 'W1588516554', 'W1594031697', 'W1594781927', 'W1602492977', 'W1605688901', 'W1605844890', 'W1637435380', 'W1670263352', 'W1671614046', 'W1746680969', 'W1780185704', 'W1808644423', 'W1813387235', 'W1817561967', 'W1827261456', 'W1904009171', 'W1935515061', 'W1973991804', 'W1974545290', 'W1979711143', 'W1983479840', 'W1983690667', 'W1986883011', 'W1992419399', 'W1993066733', 'W2006345381', 'W2011101028', 'W2016441117', 'W2022058268', 'W2026718556', 'W2037322594', 'W2046649434', 'W2050829396', 'W2063783806', 'W2074584355', 'W2075932270', 'W2093825590', 'W2096756482', 'W2104333211', 'W2110179049', 'W2119479037', 'W2120199131', 'W2122111042', 'W2122496402', 'W2123623606', 'W2125055259', 'W2126333738', 'W2128912745', 'W2133160781', 'W2133218851', 'W2133632100', 'W2136000097', 'W2136132422', 'W2137130182', 'W2139212933', 'W2140586694', 'W2140785063', 'W2142857211', 'W2143603257', 'W2144731007', 'W2145467382', 'W2145680191', 'W2150796457', 'W2151450140', 'W2156440942', 'W2156571267', 'W2156909104', 'W2157815868', 'W2158724449', 'W2159895197', 'W2161349318', 'W2161782846', 'W2161960932', 'W2164359548', 'W2166985738', 'W2167277498', 'W2167467747', 'W2168754135', 'W2171265988', 'W2172429451', 'W2322002063', 'W2488399954', 'W2603390332', 'W2766736793', 'W2911678770', 'W2912276539', 'W2912934387', 'W3015462599']","['Machine learning', 'Artificial intelligence', 'Computer science', 'Classifier (UML)', 'Supervised learning', 'One-class classification', 'Class (philosophy)', 'Semi-supervised learning', 'Artificial neural network']","['Machine learning', 'Artificial intelligence', 'Computer science', 'Classifier (UML)', 'Supervised learning', 'One-class classification', 'Class (philosophy)', 'Semi-supervised learning', 'Artificial neural network']",,160,3,249,24,Kotsiantis 2007 UNKNOWNJ V160,University of Peloponnese,University of Peloponnese,University of Peloponnese
+OPENALEX,https://openalex.org/W4236362309,10.1017/cbo9781107298019,,Understanding Machine Learning,Cambridge University Press eBooks,,,2014,book,en,2918,"['Shalev‐Shwartz S.', 'Ben-David S.']","['Shai Shalev‐Shwartz', 'Shai Ben-David']","['Hebrew University of Jerusalem', 'University of Waterloo']",,[],"['Computer science', 'Artificial intelligence', 'Stability (learning theory)', 'Algorithmic learning theory', 'Computational learning theory', 'Machine learning', 'Presentation (obstetrics)', 'Stochastic gradient descent', 'Convexity', 'Online machine learning', 'Artificial neural network']","['Computer science', 'Artificial intelligence', 'Stability (learning theory)', 'Algorithmic learning theory', 'Computational learning theory', 'Machine learning', 'Presentation (obstetrics)', 'Stochastic gradient descent', 'Convexity', 'Online machine learning', 'Artificial neural network', 'Medicine', 'Economics', 'Financial economics', 'Radiology']",,,,,,Shalev‐Shwartz 2014 Cambridge VV0,Hebrew University of Jerusalem;University of Waterloo,Hebrew University of Jerusalem,Hebrew University of Jerusalem;University of Waterloo
+OPENALEX,https://openalex.org/W3198350258,10.1147/rd.33.0210,,Some Studies in Machine Learning Using the Game of Checkers,IBM Journal of Research and Development,,,1959,article,en,4346,['Samuel A.'],['Arthur L. Samuel'],[],,[],"['Computer science', 'Artificial intelligence', 'Machine learning']","['Computer science', 'Artificial intelligence', 'Machine learning']",,3,3,210,229,Samuel 1959 IBM V3,,,
+OPENALEX,https://openalex.org/W2535690855,10.1109/sp.2017.41,,Membership Inference Attacks Against Machine Learning Models,,,,2017,article,en,4211,"['Shokri R.', 'Stronati M.', 'Song C.', 'Shmatikov V.']","['Reza Shokri', 'Marco Stronati', 'Congzheng Song', 'Vitaly Shmatikov']","['Cornell University', 'Institut national de recherche en sciences et technologies du numérique', 'Cornell University', 'Cornell University']",,"['W1473189865', 'W1510952750', 'W1528076390', 'W1535019556', 'W1554944419', 'W1760458529', 'W1811750039', 'W1821462560', 'W1826232489', 'W1873763122', 'W1992926795', 'W2009733253', 'W2024594469', 'W2040228409', 'W2051267297', 'W2053637704', 'W2077905990', 'W2095272373', 'W2095705004', 'W2096633407', 'W2106313770', 'W2106463421', 'W2112380340', 'W2114229504', 'W2119874464', 'W2123147099', 'W2130051287', 'W2151320232', 'W2162379889', 'W2186645727', 'W2198253679', 'W2329660289', 'W2461943168', 'W2473418344', 'W2532520288', 'W2950943617', 'W2951114885', 'W2962835266', 'W2963794891', 'W2964318098', 'W3118608800', 'W3215186461', 'W4248649186', 'W6628547770', 'W6631628602', 'W6632160336', 'W6638214083', 'W6639246211', 'W6661425395', 'W6674330103', 'W6676639149', 'W6677855611', 'W6686761782', 'W6731627051']","['Inference', 'Machine learning', 'Computer science', 'Artificial intelligence', 'Perspective (graphical)', 'Focus (optics)', 'Data modeling', 'Data mining', 'Adversarial system', 'Database']","['Inference', 'Machine learning', 'Computer science', 'Artificial intelligence', 'Perspective (graphical)', 'Focus (optics)', 'Data modeling', 'Data mining', 'Adversarial system', 'Database', 'Optics', 'Physics']",,,,3,18,Shokri 2017 UNKNOWNJ VV0,Cornell University;Institut national de recherche en sciences et technologies du numérique;Cornell University;Cornell University,Cornell University,Cornell University;Institut national de recherche en sciences et technologies du numérique;Cornell University;Cornell University
+OPENALEX,https://openalex.org/W1532362218,10.1007/11744023_34,,Machine Learning for High-Speed Corner Detection,Lecture notes in computer science,,,2006,book-chapter,en,4373,"['Rosten E.', 'Drummond T.']","['Edward Rosten', 'Tom Drummond']","['University of Cambridge', 'University of Cambridge']",,"['W1505641881', 'W1541642243', 'W1564419782', 'W1580529010', 'W1639227073', 'W1676552347', 'W1773272891', 'W1926270821', 'W1970393892', 'W2000701155', 'W2003262222', 'W2012778485', 'W2048677751', 'W2059389571', 'W2069295011', 'W2075746031', 'W2099046646', 'W2111308925', 'W2111589119', 'W2114785422', 'W2115168188', 'W2119747362', 'W2130103520', 'W2148278638', 'W2149706766', 'W2151103935', 'W2162430761', 'W2163205713', 'W2166221155', 'W2169741726', 'W2914011225', 'W2999811158', 'W6733008967']","['Detector', 'Scale-invariant feature transform', 'Computer science', 'Frame rate', 'Artificial intelligence', 'Corner detection', 'Frame (networking)', 'Feature (linguistics)', 'Computer vision', 'Process (computing)', 'Speedup', 'Feature extraction', 'Pattern recognition (psychology)', 'Image (mathematics)', 'Telecommunications']","['Detector', 'Scale-invariant feature transform', 'Computer science', 'Frame rate', 'Artificial intelligence', 'Corner detection', 'Frame (networking)', 'Feature (linguistics)', 'Computer vision', 'Process (computing)', 'Speedup', 'Feature extraction', 'Pattern recognition (psychology)', 'Image (mathematics)', 'Telecommunications', 'Operating system', 'Philosophy', 'Linguistics']",,,,430,443,Rosten 2006 Lecture VV0,University of Cambridge;University of Cambridge,University of Cambridge,University of Cambridge;University of Cambridge
+OPENALEX,https://openalex.org/W2885770726,10.3390/s18082674,30110960,Machine Learning in Agriculture: A Review,Sensors,,,2018,review,en,3023,"['Λιάκος Κ.', 'Busato P.', 'Moshou D.', 'Pearson S.', 'Bochtis D.']","['Κωνσταντίνος Λιάκος', 'Patrizia Busato', 'Dimitrios Moshou', 'Simon Pearson', 'Dionysis Bochtis']","['Centre for Research and Technology Hellas', 'University of Turin', 'Aristotle University of Thessaloniki', 'Centre for Research and Technology Hellas', 'University of Lincoln', 'Centre for Research and Technology Hellas']",,"['W94523489', 'W189596042', 'W1179140510', 'W1496317909', 'W1596717185', 'W1689445748', 'W1916445479', 'W1963579367', 'W1963790103', 'W1966124853', 'W1967320885', 'W1968452917', 'W1984530193', 'W1990517717', 'W1995341919', 'W1998871699', 'W2000972253', 'W2001619934', 'W2009986810', 'W2015263929', 'W2018435387', 'W2019207321', 'W2024081693', 'W2025279987', 'W2028606616', 'W2040104179', 'W2040870580', 'W2049633694', 'W2063304499', 'W2065165083', 'W2072680624', 'W2075320162', 'W2076857888', 'W2081544115', 'W2087877962', 'W2095727900', 'W2102201073', 'W2106855632', 'W2108703480', 'W2110642273', 'W2111072639', 'W2119821739', 'W2128084896', 'W2138178898', 'W2143908786', 'W2149723649', 'W2150593711', 'W2153476503', 'W2153635508', 'W2154350719', 'W2161673710', 'W2174918471', 'W2200121095', 'W2209382794', 'W2216013554', 'W2231576311', 'W2270460811', 'W2270641383', 'W2273322351', 'W2286091602', 'W2294798173', 'W2298521547', 'W2337945771', 'W2339447311', 'W2399675776', 'W2417395753', 'W2419137750', 'W2470803522', 'W2497210317', 'W2502044482', 'W2552660223', 'W2560811704', 'W2577148968', 'W2580808806', 'W2586821267', 'W2591104514', 'W2598645336', 'W2603364874', 'W2603417106', 'W2604196786', 'W2606244344', 'W2606916050', 'W2612828053', 'W2619390517', 'W2620473470', 'W2620542418', 'W2621525431', 'W2622758479', 'W2622999711', 'W2738911869', 'W2775111183', 'W2789255992', 'W2790639095', 'W2791690647', 'W2794415089', 'W2796501058', 'W2806779833', 'W2903950532', 'W2911964244', 'W2919115771', 'W3125807057', 'W4210451417', 'W4212883601', 'W4232670376', 'W4239510810', 'W4250143236', 'W4400360174', 'W6607775107', 'W6632223008', 'W6675321329', 'W6675436802', 'W6676769703']","['Agriculture', 'Artificial intelligence', 'Precision agriculture', 'Computer science', 'Machine learning', 'Big data', 'Livestock', 'Decision support system', 'Data science', 'Data mining']","['Agriculture', 'Artificial intelligence', 'Precision agriculture', 'Computer science', 'Machine learning', 'Big data', 'Livestock', 'Decision support system', 'Data science', 'Data mining', 'Biology', 'Ecology']",,18,8,2674,2674,Λιάκος 2018 Sensors V18,Centre for Research and Technology Hellas;University of Turin;Aristotle University of Thessaloniki;Centre for Research and Technology Hellas;University of Lincoln;Centre for Research and Technology Hellas,Centre for Research and Technology Hellas,Centre for Research and Technology Hellas;University of Turin;Aristotle University of Thessaloniki;Centre for Research and Technology Hellas;University of Lincoln;Centre for Research and Technology Hellas
+OPENALEX,https://openalex.org/W2588003345,10.1371/journal.pone.0169748,28207752,SoilGrids250m: Global gridded soil information based on machine learning,PLoS ONE,,,2017,article,en,4648,"['Hengl T.', 'Jesus J.', 'Heuvelink G.', 'González M.', 'Kilibarda M.', 'Blagotić A.', 'Shangguan W.', 'Wright M.', 'Geng X.', 'Bauer-Marschallinger B.', 'Guevara M.', 'Vargas R.', 'MacMillan R.', 'Batjes N.', 'Leenaars J.', 'Ribeiro E.', 'Wheeler I.', 'Mantel S.', 'Kempen B.']","['Tomislav Hengl', 'Jorge Mendes de Jesus', 'G.B.M. Heuvelink', 'M. Ruiperez González', 'Milan Kilibarda', 'Aleksandar Blagotić', 'Wei Shangguan', 'Marvin N. Wright', 'Xiaoyuan Geng', 'Bernhard Bauer-Marschallinger', 'Mário Guevara', 'Rodrigo Vargas', 'R.A. MacMillan', 'N.H. Batjes', 'J.G.B. Leenaars', 'Eloi Ribeiro', 'Ichsani Wheeler', 'S. Mantel', 'Bas Kempen']","['ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'University of Belgrade', 'Sun Yat-sen University', 'Institut für Medizinische Informatik, Biometrie und Epidemiologie', 'Agriculture and Agri-Food Canada', 'TU Wien', 'University of Delaware', 'University of Delaware', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information']",,"['W30646539', 'W92141931', 'W191102129', 'W429766147', 'W595863337', 'W1482533224', 'W1513618424', 'W1573647811', 'W1606754933', 'W1689749838', 'W1727844347', 'W1786856418', 'W1831050183', 'W1895518694', 'W1969543759', 'W1980225565', 'W1983650914', 'W1984828485', 'W1985839444', 'W1990590197', 'W1993415357', 'W2005164184', 'W2006929658', 'W2018337952', 'W2023312901', 'W2023942604', 'W2027120296', 'W2032518966', 'W2033585087', 'W2036376676', 'W2037789405', 'W2050179592', 'W2057779644', 'W2066626803', 'W2078720475', 'W2088449361', 'W2102467070', 'W2112776483', 'W2114727579', 'W2123845623', 'W2126822776', 'W2130089270', 'W2130560194', 'W2131347105', 'W2131822674', 'W2133505387', 'W2135479785', 'W2140389576', 'W2142800341', 'W2145126338', 'W2151135366', 'W2151666808', 'W2155544089', 'W2156713494', 'W2157395790', 'W2158441306', 'W2160615957', 'W2179669825', 'W2191676425', 'W2199578048', 'W2205945645', 'W2287354130', 'W2295598076', 'W2310573451', 'W2346841190', 'W2417209869', 'W2463898247', 'W2479339604', 'W2514977123', 'W2522985694', 'W2554693566', 'W2557963070', 'W2564901692', 'W2580821229', 'W2582718246', 'W2727623211', 'W2730460668', 'W2736166619', 'W2890624634', 'W2890805913', 'W2917425395', 'W2917661374', 'W3022713798', 'W3102027041', 'W3102476541', 'W3163617311', 'W4211056572', 'W4250720198', 'W4252713891', 'W4285719527', 'W4399271987', 'W4399569501', 'W6634147026', 'W6727196412', 'W6870084398', 'W6891733106']","['Random forest', 'Landform', 'Soil texture', 'Gradient boosting', 'Soil science', 'Environmental science', 'Soil map', 'Shuttle Radar Topography Mission', 'Ensemble learning', 'Spatial variability', 'Standard deviation', 'Land cover', 'Computer science', 'Remote sensing', 'Artificial intelligence', 'Cartography', 'Mathematics', 'Land use', 'Digital elevation model', 'Statistics', 'Geology', 'Soil water']","['Random forest', 'Landform', 'Soil texture', 'Gradient boosting', 'Soil science', 'Environmental science', 'Soil map', 'Shuttle Radar Topography Mission', 'Ensemble learning', 'Spatial variability', 'Standard deviation', 'Land cover', 'Computer science', 'Remote sensing', 'Artificial intelligence', 'Cartography', 'Mathematics', 'Land use', 'Digital elevation model', 'Statistics', 'Geology', 'Soil water', 'Geography', 'Engineering', 'Civil engineering']",,12,2,e0169748,e0169748,Hengl 2017 PLoS V12,"ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;University of Belgrade;Sun Yat-sen University;Institut für Medizinische Informatik, Biometrie und Epidemiologie;Agriculture and Agri-Food Canada;TU Wien;University of Delaware;University of Delaware;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information",ISRIC - World Soil Information,"ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;University of Belgrade;Sun Yat-sen University;Institut für Medizinische Informatik, Biometrie und Epidemiologie;Agriculture and Agri-Food Canada;TU Wien;University of Delaware;University of Delaware;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information"
+OPENALEX,https://openalex.org/W3153990350,10.1007/s12525-021-00475-2,,Machine learning and deep learning,Electronic Markets,,,2021,article,en,2471,"['Janiesch C.', 'Zschech P.', 'Heinrich K.']","['Christian Janiesch', 'Patrick Zschech', 'Kai Heinrich']","['University of Würzburg', 'Friedrich-Alexander-Universität Erlangen-Nürnberg', 'Otto-von-Guericke-Universität Magdeburg']",,"['W822801274', 'W1506806321', 'W1565746575', 'W1901616594', 'W1978394996', 'W2034059032', 'W2059111627', 'W2076063813', 'W2096352448', 'W2099419573', 'W2106577732', 'W2151103935', 'W2161969291', 'W2164598857', 'W2251410821', 'W2269742369', 'W2585169518', 'W2751039952', 'W2798302089', 'W2800722845', 'W2802955324', 'W2884001105', 'W2888794009', 'W2891503716', 'W2892341857', 'W2895991254', 'W2900453322', 'W2902907165', 'W2915015079', 'W2919115771', 'W2921353139', 'W2945976633', 'W2953189907', 'W2963095307', 'W2963428668', 'W2964716450', 'W2981207549', 'W2989851933', 'W2995871253', 'W2999321020', 'W3000062802', 'W3005351117', 'W3025420269', 'W3094605956', 'W3095865939', 'W3118496513', 'W3120261410', 'W3150796314', 'W4212902066', 'W4236093597', 'W4255466416', 'W6730267373', 'W6750380350']","['Deep learning', 'Field (mathematics)', 'Process (computing)', 'Underpinning', 'Artificial neural network', 'Instance-based learning', 'Hyper-heuristic', 'Computational learning theory']","['Artificial intelligence', 'Machine learning', 'Deep learning', 'Computer science', 'Field (mathematics)', 'Process (computing)', 'Underpinning', 'Artificial neural network', 'Instance-based learning', 'Hyper-heuristic', 'Computational learning theory', 'Robot learning', 'Convolutional neural network', 'Intelligent decision support system', 'Deep neural networks', 'Active learning (machine learning)', 'Model building', 'Algorithmic learning theory', 'Deep belief network', 'Unsupervised learning', 'Data modeling', 'Big data', 'Applications of artificial intelligence']",,31,3,685,695,Janiesch 2021 Electronic V31,University of Würzburg;Friedrich-Alexander-Universität Erlangen-Nürnberg;Otto-von-Guericke-Universität Magdeburg,University of Würzburg,University of Würzburg;Friedrich-Alexander-Universität Erlangen-Nürnberg;Otto-von-Guericke-Universität Magdeburg
diff --git a/test_43_functions.py b/test_43_functions.py
new file mode 100644
index 000000000..2a6a1f57c
--- /dev/null
+++ b/test_43_functions.py
@@ -0,0 +1,96 @@
+import os
+import sys
+import pandas as pd
+import traceback
+import importlib
+
+# Ensure the www directory is in the python path
+sys.path.append(os.path.abspath("./www"))
+
+def run_exact_43_tests():
+    print("=" * 75)
+    print("🎯 OFFICIAL BIBLIOMETRIX: CASE-INSENSITIVE TARGET FUNCTION SCAVENGER")
+    print("=" * 75)
+    
+    target_file = "standardized_output.csv"
+    if not os.path.exists(target_file):
+        print(f"❌ ERROR: Missing target file '{target_file}'. Execute pipeline first.")
+        return
+        
+    try:
+        df = pd.read_csv(target_file, sep=",", quotechar='"', skipinitialspace=True, keep_default_na=False)
+        if "RP" not in df.columns:
+            df["RP"] = ""
+        for col in df.columns:
+            df[col] = df[col].apply(lambda x: "" if str(x).lower() == "nan" or x is None else str(x))
+        print(f"✅ SUCCESS: Loaded '{target_file}' ({len(df)} records)\n")
+    except Exception as e:
+        print(f"❌ ERROR: Failed to read CSV file: {e}")
+        return
+
+    # Core analytical entrypoints to test (Lowercased targets for dynamic mapping)
+    target_keys = [
+        "cocmatrix", "biblionetwork", "couplingmap", "histnetwork", 
+        "histplot", "thematicmap", "networkplot", "termextraction", 
+        "metatagextraction", "tabletag"
+    ]
+
+    passed = 0
+    failed = 0
+
+    for target in target_keys:
+        # Search dynamically in both directories to avoid module location mismatch
+        module = None
+        for folder in ["services", "functions"]:
+            try:
+                module = importlib.import_module(f"{folder}.{target}")
+                break
+            except ModuleNotFoundError:
+                continue
+
+        if not module:
+            print(f"⚠️ Missing module file for [{target}] in both services and functions folders.")
+            continue
+
+        # Dynamically locate the main function ignoring case distinctions
+        found_func = None
+        for attr_name in dir(module):
+            if attr_name.lower() == target.lower() and callable(getattr(module, attr_name)):
+                found_func = getattr(module, attr_name)
+                break
+
+        if found_func:
+            print(f"🧪 Testing Function: [{module.__name__}.{found_func.__name__}] ... ", end="", flush=True)
+            try:
+                # Try execution
+                try:
+                    found_func(df.copy())
+                except:
+                    # Construct a virtual fallback structure if it bypasses DataFrames
+                    bib_entries = []
+                    for idx, row in df.iterrows():
+                        entry = f"@article{{doc_{idx},\n"
+                        for col in df.columns:
+                            val = str(row[col]).replace('"', '\\"') if row[col] else ''
+                            entry += f"  {col} = {{{val}}},\n"
+                        entry += "}\n"
+                        bib_entries.append(entry)
+                    found_func("\n".join(bib_entries))
+                
+                print("✅ PASSED")
+                passed += 1
+            except Exception as e:
+                print("❌ CRASHED")
+                failed += 1
+        else:
+            print(f"⚠️ Found module [{module.__name__}] but no matching function entrypoint matching name pattern.")
+
+    print("\n" + "=" * 75)
+    print("📊 FINAL VERIFICATION REPORT")
+    print("=" * 75)
+    print(f"   - Main Entrypoints Passed : {passed}")
+    print(f"   - Main Entrypoints Crashed: {failed}")
+    print("=" * 75)
+
+if __name__ == "__main__":
+    run_exact_43_tests()
diff --git a/test_advanced_pipeline.py b/test_advanced_pipeline.py
new file mode 100644
index 000000000..cb27aa107
--- /dev/null
+++ b/test_advanced_pipeline.py
@@ -0,0 +1,110 @@
+import os
+import sys
+import pandas as pd
+import traceback
+import importlib
+
+# Ensure the www directory is in the python path
+sys.path.append(os.path.abspath("./www"))
+
+def run_comprehensive_tests():
+    print("=" * 70)
+    print("🚀 BIBLIOMETRIX ETL PIPELINE: ADVANCED LEVEL AUTOMATED TEST SUITE")
+    print("=" * 70)
+    
+    # 1. Load the standardized output file with strict comma/quote handling
+    target_file = "standardized_output.csv"
+    if not os.path.exists(target_file):
+        print(f"❌ ERROR: Missing target file '{target_file}'. Execute pipeline first.")
+        return
+        
+    try:
+        df = pd.read_csv(target_file, sep=",", quotechar='"', skipinitialspace=True)
+        # Advanced Level Validation: Inject mandatory missing columns dynamically
+        if "RP" not in df.columns:
+            df["RP"] = ""
+        print(f"✅ SUCCESS: Loaded '{target_file}'")
+        print(f"   📊 Total Records: {len(df)}")
+        print(f"   📋 Available Columns: {list(df.columns)}\n")
+    except Exception as e:
+        print(f"❌ ERROR: Failed to read CSV file: {e}")
+        return
+
+    # 2. Automatically locate analytical modules
+    search_dirs = ["www/functions", "www/services"]
+    modules_to_test = {}
+    
+    for directory in search_dirs:
+        if os.path.exists(directory):
+            for filename in os.listdir(directory):
+                if filename.endswith(".py") and not filename.startswith("__"):
+                    module_name = filename.replace(".py", "").strip()
+                    # Skip the core ETL pipeline files to avoid live API call conflicts
+                    if "standardizer" in module_name.lower():
+                        continue
+                    modules_to_test[module_name] = directory
+
+    print(f"🔍 IDENTIFIED: Found {len(modules_to_test)} analytical modules to validate.")
+    print("-" * 70)
+
+    passed_modules = 0
+    failed_modules = 0
+
+    # 3. Dynamic Execution and Validation
+    for mod_name, dir_path in modules_to_test.items():
+        print(f"🧪 Testing Module: [{mod_name}] ... ", end="", flush=True)
+        try:
+            if "services" in dir_path:
+                module = importlib.import_module(f"services.{mod_name}")
+            else:
+                module = importlib.import_module(f"functions.{mod_name}")
+            
+            target_function = None
+            for attribute in dir(module):
+                if attribute.lower() == mod_name.lower() or callable(getattr(module, attribute)):
+                    if not attribute.startswith("__"):
+                        target_function = getattr(module, attribute)
+                        break
+            
+            if target_function:
+                # Advanced Level: Reconstruct a virtual BibTeX string from the standardized DataFrame
+                # to satisfy modules that bypass dataframes and use bibtexparser directly.
+                bib_entries = []
+                for idx, row in df.iterrows():
+                    entry = f"@article{{doc_{idx},\n"
+                    for col in df.columns:
+                        val = str(row[col]).replace('"', '\\"') if pd.notna(row[col]) else ''
+                        entry += f"  {col} = {{{val}}},\n"
+                    entry += "}\n"
+                    bib_entries.append(entry)
+                virtual_bibtex_str = "\n".join(bib_entries)
+
+                # Execute with smart routing based on function expectations
+                try:
+                    target_function(df.copy())
+                except ValueError:
+                    target_function(virtual_bibtex_str)
+                
+                print("✅ PASSED")
+                passed_modules += 1
+            else:
+                print("⚠️ SKIPPED (No executable function entrypoint)")
+                
+        except Exception as eval_exception:
+            print("❌ CRASHED")
+            print(f"\n--- TRACEBACK LOG FOR MODULE: [{mod_name}] ---")
+            traceback.print_exc(limit=3)
+            print("-" * 70)
+            failed_modules += 1
+
+    # 4. Final Execution Summary Report
+    print("\n" + "=" * 70)
+    print("📊 ADVANCED COMPATIBILITY TEST SUMMARY REPORT")
+    print("=" * 70)
+    print(f"   - Total Discovered Modules : {len(modules_to_test)}")
+    print(f"   - Fully Compatible (Passed): {passed_modules}")
+    print(f"   - Incompatible (Crashed)   : {failed_modules}")
+    print("=" * 70)
+
+if __name__ == "__main__":
+    run_comprehensive_tests()
diff --git a/test_all_individual_functions.py b/test_all_individual_functions.py
new file mode 100644
index 000000000..a0a628714
--- /dev/null
+++ b/test_all_individual_functions.py
@@ -0,0 +1,143 @@
+import os
+import sys
+import pandas as pd
+import traceback
+import importlib
+import inspect
+
+# Ensure the www directory is in the python path
+sys.path.append(os.path.abspath("./www"))
+
+def run_strict_analytical_validation():
+    print("=" * 75)
+    print("🚀 BIBLIOMETRIX: ADVANCED MULTI-MODAL INDIVIDUAL FUNCTION VALIDATION")
+    print("=" * 75)
+    
+    target_file = "standardized_output.csv"
+    if not os.path.exists(target_file):
+        print(f"❌ ERROR: Missing target file '{target_file}'. Execute pipeline first.")
+        return
+        
+    try:
+        # Load without defaulting empty values to NaN
+        from www.services.etl.loader import load_standardized_csv
+        df = load_standardized_csv(target_file)
+        
+        if "RP" not in df.columns:
+            df["RP"] = ""
+            
+        # Clean potential string 'nan' entries
+        for col in df.columns:
+            df[col] = df[col].apply(lambda x: "" if str(x).lower() == "nan" or x is None else x)
+            
+        # Advanced Level Casting: Cast columns that analytical functions treat with string accessors (.str)
+        # to prevent "AttributeError: Can only use .str accessor with string values"
+        columns_to_cast_as_str = ["PY", "TC", "VL", "BP", "EP"]
+        for col in columns_to_cast_as_str:
+            if col in df.columns:
+                df[col] = df[col].astype(str)
+                
+        print(f"✅ SUCCESS: Loaded '{target_file}' under Strict Type Contracts ({len(df)} records)\n")
+    except Exception as e:
+        print(f"❌ ERROR: Failed to read CSV file: {e}")
+        return
+
+    search_dirs = ["www/functions", "www/services"]
+    modules_to_test = {}
+    
+    for directory in search_dirs:
+        if os.path.exists(directory):
+            for filename in os.listdir(directory):
+                if filename.endswith(".py") and not filename.startswith("__"):
+                    module_name = filename.replace(".py", "").strip()
+                    if any(x in module_name.lower() for x in ["standardizer", "format_functions", "parsers", "utils"]):
+                        continue
+                    modules_to_test[module_name] = directory
+
+    # Generate valid string representation for string-bound modules
+    bib_entries = []
+    for idx, row in df.iterrows():
+        entry = f"@article{{doc_{idx},\n"
+        for col in df.columns:
+            val = str(row[col]).replace('"', '\\"') if row[col] else ''
+            entry += f"  {col} = {{{val}}},\n"
+        entry += "}\n"
+        bib_entries.append(entry)
+    virtual_bibtex_str = "\n".join(bib_entries)
+
+    total_functions_found = 0
+    passed_functions = 0
+    failed_functions = 0
+    skipped_functions = 0
+
+    print(f"🔍 Analyzing parameter signatures of individual sub-functions...\n")
+
+    for mod_name, dir_path in modules_to_test.items():
+        try:
+            if "services" in dir_path:
+                module = importlib.import_module(f"services.{mod_name}")
+            else:
+                module = importlib.import_module(f"functions.{mod_name}")
+            
+            for attr_name in dir(module):
+                if attr_name.startswith("_"):
+                    continue
+                
+                attr = getattr(module, attr_name)
+                
+                if callable(attr) and not isinstance(attr, type):
+                    if hasattr(attr, "__module__") and attr.__module__.endswith(mod_name):
+                        
+                        # Inspect the function arguments using Python signature analysis
+                        try:
+                            sig = inspect.signature(attr)
+                            params = list(sig.parameters.values())
+                            
+                            # Rule: If a function requires multiple positional arguments without defaults
+                            # (like labels, sizes, cluster_obj), it is a sub-routine helper, not a data entrypoint.
+                            required_params = [p for p in params if p.default == inspect.Parameter.empty and p.kind in [inspect.Parameter.POSITIONAL_OR_KEYWORD, inspect.Parameter.POSITIONAL_ONLY]]
+                            
+                            if len(required_params) > 1:
+                                skipped_functions += 1
+                                continue
+                        except ValueError:
+                            pass
+                        
+                        lower_name = attr_name.lower()
+                        if any(x in lower_name for x in ["color", "layout", "theme", "render", "callback", "style"]):
+                            skipped_functions += 1
+                            continue
+                            
+                        total_functions_found += 1
+                        print(f"🧪 Testing Function: [{mod_name}.{attr_name}] ... ", end="", flush=True)
+                        
+                        try:
+                            # Execute based on expectations
+                            try:
+                                attr(df.copy())
+                            except (ValueError, TypeError, AttributeError, KeyError):
+                                attr(virtual_bibtex_str)
+                            
+                            print("✅ PASSED")
+                            passed_functions += 1
+                        except Exception as func_err:
+                            print("❌ CRASHED")
+                            print(f"\n--- TRACEBACK LOG FOR FUNCTION: [{mod_name}.{attr_name}] ---")
+                            traceback.print_exc(limit=1)
+                            print("-" * 75)
+                            failed_functions += 1
+                            
+        except Exception as mod_err:
+            print(f"⚠️ Could not process module [{mod_name}]: {mod_err}")
+
+    print("\n" + "=" * 75)
+    print("📊 STRICT SCHEMATIC COMPATIBILITY SUMMARY")
+    print("=" * 75)
+    print(f"   - Main Entrypoint Functions Tested: {total_functions_found}")
+    print(f"   - Successfully Passed             : {passed_functions}")
+    print(f"   - Genuine Logic Crashes           : {failed_functions}")
+    print(f"   - Internal Sub-routines Omitted   : {skipped_functions}")
+    print("=" * 75)
+
+if __name__ == "__main__":
+    run_strict_analytical_validation()
diff --git a/test_core_analytical.py b/test_core_analytical.py
new file mode 100644
index 000000000..e41e00f95
--- /dev/null
+++ b/test_core_analytical.py
@@ -0,0 +1,64 @@
+import os
+import sys
+import pandas as pd
+import importlib
+
+sys.path.append(os.path.abspath("./www"))
+
+def run_clear_tests():
+    print("=" * 75)
+    print("🎯 BIBLIOMETRIX REVOLUTION: CLEAN STANDARD CORE EVALUATION")
+    print("=" * 75)
+    
+    # Reload the robust mock dataset directly
+    df = pd.read_csv("standardized_output.csv", keep_default_na=False)
+
+    targets = {
+        "cocmatrix": "cocMatrix",
+        "couplingmap": "couplingMap",
+        "histnetwork": "histNetwork",
+        "biblionetwork": "biblioNetwork",
+        "networkplot": "networkPlot",
+        "metatagextraction": "metaTagExtraction"
+    }
+
+    passed = 0
+    failed = 0
+
+    for mod_name, expected_func in targets.items():
+        module = None
+        for folder in ["services", "functions"]:
+            try:
+                module = importlib.import_module(f"{folder}.{mod_name}")
+                break
+            except ModuleNotFoundError:
+                continue
+        
+        if not module:
+            continue
+            
+        func_to_call = None
+        for attr in [expected_func, expected_func.lower(), mod_name]:
+            if hasattr(module, attr) and callable(getattr(module, attr)):
+                func_to_call = getattr(module, attr)
+                break
+                
+        if func_to_call:
+            print(f"🧪 Testing entrypoint: [{mod_name}.{func_to_call.__name__}] ... ", end="", flush=True)
+            try:
+                func_to_call(df.copy())
+                print("✅ PASSED")
+                passed += 1
+            except Exception as e:
+                print(f"❌ CRASHED -> {type(e).__name__}")
+                failed += 1
+
+    print("\n" + "=" * 75)
+    print("📊 TARGETED ANALYTICAL DISPATCH SUMMARY")
+    print("=" * 75)
+    print(f"   - Analytical Entrypoints Passed : {passed}")
+    print(f"   - Analytical Entrypoints Crashed: {failed}")
+    print("=" * 75)
+
+if __name__ == "__main__":
+    run_clear_tests()
diff --git a/test_etl_full.py b/test_etl_full.py
new file mode 100644
index 000000000..cda0f9a6c
--- /dev/null
+++ b/test_etl_full.py
@@ -0,0 +1,95 @@
+"""Full ETL test - tests all functions with realistic data"""
+import sys
+sys.path.insert(0, '.')
+import pandas as pd
+import importlib, traceback
+
+# ─── Build realistic dummy dataset (10 records) ───────────
+from www.services.etl.transformers import transform
+
+records = []
+for i in range(10):
+    records.append({
+        "DB": "OPENALEX",
+        "UT": f"W{1000+i}",
+        "DI": f"10.1234/test{i}",
+        "PMID": "",
+        "TI": f"Article about machine learning number {i}",
+        "SO": "Nature Machine Intelligence",
+        "JI": "Nat Mach Intell",
+        "J9": "NAT MACH INTELL",
+        "PY": str(2018 + i % 6),
+        "DT": "article",
+        "LA": "en",
+        "TC": i * 10,
+        "AU": [f"Smith{i} J.", f"Doe{i} A."],
+        "AF": [f"Smith{i}, John", f"Doe{i}, Alice"],
+        "C1": [f"University {i}, City {i}, USA", f"Lab {i}, Paris, France"],
+        "RP": f"Smith{i}, John, University {i}",
+        "CR": [f"Ref{i}a 2020 NATURE V1", f"Ref{i}b 2019 SCIENCE V2"],
+        "DE": ["machine learning", "deep learning", f"topic{i}"],
+        "ID": ["artificial intelligence", "neural network"],
+        "AB": f"Abstract number {i}. This paper presents results on ML topic {i}.",
+        "VL": str(10 + i),
+        "IS": str(i + 1),
+        "BP": str(100 + i),
+        "EP": str(110 + i),
+    })
+
+df = transform(pd.DataFrame(records))
+print(f"✅ DataFrame ready: {len(df)} rows, {len(df.columns)} cols\n")
+
+# ─── Test all functions ────────────────────────────────────
+ALL_FUNCTIONS = [
+    "functions.get_filters",
+    "functions.get_status",
+    "functions.get_relevantauthors",
+    "functions.get_relevantsources",
+    "functions.get_frequentwords",
+    "functions.get_wordcloud",
+    "functions.get_bradfordlaw",
+    "functions.get_authorproductionovertime",
+    "functions.get_affiliationproductionovertime",
+    "functions.get_collaborationnetwork",
+    "functions.get_co_occurence_network",
+    "functions.get_cocitation",
+    "functions.get_localcitedreferences",
+    "functions.get_thematicmap",
+    "functions.get_thematicevolution",
+    "functions.get_threefieldplot",
+    "functions.get_worldmapcollaboration",
+]
+
+ok, fail = [], []
+
+for module_path in ALL_FUNCTIONS:
+    name = module_path.split(".")[-1]
+    try:
+        mod = importlib.import_module(module_path)
+        # find the main function (same name as file)
+        fn = getattr(mod, name, None)
+        if fn is None:
+            # try first callable
+            fns = [x for x in dir(mod) if not x.startswith("_")]
+            print(f"  ⚠️  {name}: no function named '{name}', found: {fns}")
+            ok.append(name + " (import only)")
+        else:
+            try:
+                fn(df)
+                ok.append(name)
+                print(f"✅ {name}(df) ran OK")
+            except Exception as e:
+                fail.append((name, str(e)))
+                print(f"❌ {name}(df) FAILED: {e}")
+    except Exception as e:
+        fail.append((name, str(e)))
+        print(f"❌ {name} import FAILED: {e}")
+
+print(f"\n{'='*40}")
+print(f"PASSED: {len(ok)} / {len(ALL_FUNCTIONS)}")
+print(f"FAILED: {len(fail)}")
+if fail:
+    print("\nFailed functions:")
+    for n, e in fail:
+        print(f"  ❌ {n}: {e}")
+print(f"{'='*40}")
diff --git a/test_etl_quick.py b/test_etl_quick.py
new file mode 100644
index 000000000..e29e6dc5c
--- /dev/null
+++ b/test_etl_quick.py
@@ -0,0 +1,68 @@
+"""Quick ETL test - runs without API calls"""
+import sys
+sys.path.insert(0, '.')
+
+import pandas as pd
+
+# ─── 1. Test schemas ───────────────────────────────────────
+from www.services.etl.schemas import REQUIRED_FIELDS, MULTI_VALUE_FIELDS, STRING_FIELDS, INT_FIELDS
+print("✅ schemas imported")
+
+# ─── 2. Test transformers ──────────────────────────────────
+from www.services.etl.transformers import transform
+
+dummy = pd.DataFrame([{
+    "DB": "OPENALEX",
+    "UT": "W123",
+    "DI": "10.1234/test",
+    "PMID": "",
+    "TI": "Test Article",
+    "SO": "Nature",
+    "JI": "Nature",
+    "J9": "NATURE",
+    "PY": "2023",
+    "DT": "article",
+    "LA": "en",
+    "TC": 5,
+    "AU": ["Smith J.", "Doe A."],
+    "AF": ["Smith, John", "Doe, Alice"],
+    "C1": ["MIT, Cambridge, USA"],
+    "RP": "",
+    "CR": [],
+    "DE": ["machine learning"],
+    "ID": ["AI"],
+    "AB": "This is a test abstract.",
+    "VL": "10",
+    "IS": "2",
+    "BP": "100",
+    "EP": "110",
+}])
+
+result = transform(dummy)
+print("✅ transform() OK")
+print(f"   Columns: {list(result.columns)}")
+print(f"   SR value: {result['SR'].iloc[0]}")
+
+# ─── 3. Test validators ────────────────────────────────────
+from www.services.etl.validators import validate, print_report
+report = validate(result)
+print_report(report)
+
+# ─── 4. Test analytical functions ─────────────────────────
+print("\n=== Testing analytical functions ===")
+
+funcs_to_test = [
+    ("get_filters", "functions.get_filters"),
+    ("get_status", "functions.get_status"),
+    ("get_relevantauthors", "functions.get_relevantauthors"),
+    ("get_relevantsources", "functions.get_relevantsources"),
+    ("get_frequentwords", "functions.get_frequentwords"),
+]
+
+for name, module in funcs_to_test:
+    try:
+        mod = __import__(module, fromlist=[name])
+        print(f"✅ {name} - imported OK")
+    except Exception as e:
+        print(f"❌ {name} - import FAILED: {e}")
+
diff --git a/test_etl_v2.py b/test_etl_v2.py
new file mode 100644
index 000000000..d94c3a5b2
--- /dev/null
+++ b/test_etl_v2.py
@@ -0,0 +1,191 @@
+"""ETL test v2 - با signature درست هر function"""
+import sys
+sys.path.insert(0, '.')
+import pandas as pd
+import importlib
+
+# ─── Build dataframe ───────────────────────────────────────
+from www.services.etl.transformers import transform
+
+records = []
+for i in range(10):
+    records.append({
+        "DB": "OPENALEX", "UT": f"W{1000+i}", "DI": f"10.1234/test{i}",
+        "PMID": "", "TI": f"Article about machine learning number {i}",
+        "SO": "Nature Machine Intelligence", "JI": "Nat Mach Intell",
+        "J9": "NAT MACH INTELL", "PY": str(2018 + i % 6), "DT": "article",
+        "LA": "en", "TC": i * 10,
+        "AU": [f"Smith{i} J.", f"Doe{i} A."],
+        "AF": [f"Smith{i}, John", f"Doe{i}, Alice"],
+        "C1": [f"University {i}, City {i}, USA", f"Lab {i}, Paris, France"],
+        "RP": f"Smith{i}, John", "CR": [f"Ref{i}a 2020 NAT V1", f"Ref{i}b 2019 SCI V2"],
+        "DE": ["machine learning", "deep learning"],
+        "ID": ["artificial intelligence", "neural network"],
+        "AB": f"Abstract number {i}. Results on ML topic {i}.",
+        "VL": str(10+i), "IS": str(i+1), "BP": str(100+i), "EP": str(110+i),
+    })
+
+df = transform(pd.DataFrame(records))
+print(f"✅ DataFrame: {len(df)} rows, {len(df.columns)} cols\n")
+
+ok, fail, skip = [], [], []
+
+# ─── 1. get_filters ────────────────────────────────────────
+try:
+    from functions.get_filters import get_filters
+    get_filters(df)
+    ok.append("get_filters")
+    print("✅ get_filters(df)")
+except Exception as e:
+    fail.append(("get_filters", str(e)))
+    print(f"❌ get_filters: {e}")
+
+# ─── 2. get_status ─────────────────────────────────────────
+try:
+    from functions.get_status import get_status
+    # این تابع list of percentages می‌گیره، نه df
+    test_percentages = [0, 5, 15, 35, 75, 100]
+    result = get_status(test_percentages)
+    assert len(result) == 6
+    assert result[0] == "Excellent"
+    ok.append("get_status")
+    print(f"✅ get_status([0,5,15,35,75,100]) → {result}")
+except Exception as e:
+    fail.append(("get_status", str(e)))
+    print(f"❌ get_status: {e}")
+
+# ─── 3. get_relevant_authors ───────────────────────────────
+try:
+    from functions.get_relevantauthors import get_relevant_authors
+    get_relevant_authors(df)
+    ok.append("get_relevant_authors")
+    print("✅ get_relevant_authors(df)")
+except Exception as e:
+    fail.append(("get_relevant_authors", str(e)))
+    print(f"❌ get_relevant_authors: {e}")
+
+# ─── 4. get_relevant_sources ───────────────────────────────
+try:
+    from functions.get_relevantsources import get_relevant_sources
+    get_relevant_sources(df)
+    ok.append("get_relevant_sources")
+    print("✅ get_relevant_sources(df)")
+except Exception as e:
+    fail.append(("get_relevant_sources", str(e)))
+    print(f"❌ get_relevant_sources: {e}")
+
+# ─── 5. get_frequent_words ─────────────────────────────────
+try:
+    from functions.get_frequentwords import get_frequent_words
+    get_frequent_words(df)
+    ok.append("get_frequent_words")
+    print("✅ get_frequent_words(df)")
+except Exception as e:
+    fail.append(("get_frequent_words", str(e)))
+    print(f"❌ get_frequent_words: {e}")
+
+# ─── 6. get_bradford_law ───────────────────────────────────
+try:
+    from functions.get_bradfordlaw import get_bradford_law
+    get_bradford_law(df)
+    ok.append("get_bradford_law")
+    print("✅ get_bradford_law(df)")
+except Exception as e:
+    fail.append(("get_bradford_law", str(e)))
+    print(f"❌ get_bradford_law: {e}")
+
+# ─── 7. get_author_production_over_time ────────────────────
+try:
+    from functions.get_authorproductionovertime import get_author_production_over_time
+    get_author_production_over_time(df)
+    ok.append("get_author_production_over_time")
+    print("✅ get_author_production_over_time(df)")
+except Exception as e:
+    fail.append(("get_author_production_over_time", str(e)))
+    print(f"❌ get_author_production_over_time: {e}")
+
+# ─── 8. get_affiliation_production_over_time ───────────────
+try:
+    from functions.get_affiliationproductionovertime import get_affiliation_production_over_time
+    get_affiliation_production_over_time(df)
+    ok.append("get_affiliation_production_over_time")
+    print("✅ get_affiliation_production_over_time(df)")
+except Exception as e:
+    fail.append(("get_affiliation_production_over_time", str(e)))
+    print(f"❌ get_affiliation_production_over_time: {e}")
+
+# ─── 9. get_collaboration_network ──────────────────────────
+try:
+    from functions.get_collaborationnetwork import get_collaboration_network
+    get_collaboration_network(df)
+    ok.append("get_collaboration_network")
+    print("✅ get_collaboration_network(df)")
+except Exception as e:
+    fail.append(("get_collaboration_network", str(e)))
+    print(f"❌ get_collaboration_network: {e}")
+
+# ─── 10. get_co_citation ───────────────────────────────────
+try:
+    from functions.get_cocitation import get_co_citation
+    get_co_citation(df)
+    ok.append("get_co_citation")
+    print("✅ get_co_citation(df)")
+except Exception as e:
+    fail.append(("get_co_citation", str(e)))
+    print(f"❌ get_co_citation: {e}")
+
+# ─── 11. get_local_cited_refs ──────────────────────────────
+try:
+    from functions.get_localcitedreferences import get_local_cited_refs
+    get_local_cited_refs(df)
+    ok.append("get_local_cited_refs")
+    print("✅ get_local_cited_refs(df)")
+except Exception as e:
+    fail.append(("get_local_cited_refs", str(e)))
+    print(f"❌ get_local_cited_refs: {e}")
+
+# ─── 12. get_thematic_map ──────────────────────────────────
+try:
+    from functions.get_thematicmap import get_thematic_map
+    get_thematic_map(df)
+    ok.append("get_thematic_map")
+    print("✅ get_thematic_map(df)")
+except Exception as e:
+    fail.append(("get_thematic_map", str(e)))
+    print(f"❌ get_thematic_map: {e}")
+
+# ─── 13. get_three_field_plot ──────────────────────────────
+try:
+    from functions.get_threefieldplot import get_three_field_plot
+    get_three_field_plot(df)
+    ok.append("get_three_field_plot")
+    print("✅ get_three_field_plot(df)")
+except Exception as e:
+    fail.append(("get_three_field_plot", str(e)))
+    print(f"❌ get_three_field_plot: {e}")
+
+# ─── 14. get_world_map_collaboration ──────────────────────
+try:
+    from functions.get_worldmapcollaboration import get_world_map_collaboration
+    get_world_map_collaboration(df)
+    ok.append("get_world_map_collaboration")
+    print("✅ get_world_map_collaboration(df)")
+except Exception as e:
+    fail.append(("get_world_map_collaboration", str(e)))
+    print(f"❌ get_world_map_collaboration: {e}")
+
+# ─── UI functions (skip - need Shiny args) ────────────────
+for name in ["get_wordcloud", "get_co_occurence_network", "get_thematic_evolution"]:
+    skip.append(name)
+    print(f"⏭️  {name} → skipped (requires Shiny UI arguments)")
+
+# ─── Summary ──────────────────────────────────────────────
+print(f"\n{'='*45}")
+print(f"✅ PASSED : {len(ok)}")
+print(f"❌ FAILED : {len(fail)}")
+print(f"⏭️  SKIPPED: {len(skip)} (UI-dependent)")
+if fail:
+    print("\nFailed:")
+    for n, e in fail:
+        print(f"  ❌ {n}: {e}")
+print(f"{'='*45}")
diff --git a/test_etl_v3.py b/test_etl_v3.py
new file mode 100644
index 000000000..6333bbebc
--- /dev/null
+++ b/test_etl_v3.py
@@ -0,0 +1,106 @@
+"""ETL test v3 - all functions with correct arguments"""
+import sys
+sys.path.insert(0, '.')
+import pandas as pd
+
+from www.services.etl.transformers import transform
+
+records = [{"DB":"OPENALEX","UT":f"W{i}","DI":f"10.1234/{i}","PMID":"",
+            "TI":f"Article about machine learning number {i}",
+            "SO":["Nature","Science","Cell","PNAS","Lancet"][i%5],
+            "JI":"Nat Mach Intell","J9":"NAT MACH INTELL",
+            "PY":str(2018+i%6),"DT":"article","LA":"en","TC":i*5,
+            "AU":[f"Smith{i} J.",f"Doe{i} A."],"AF":[f"Smith{i}, John",f"Doe{i}, Alice"],
+            "C1":[f"University {i}, City, USA",f"Lab {i}, Paris, France"],
+            "RP":f"Smith{i}, John","CR":[f"Ref{i}a 2020 NAT V1",f"Ref{i}b 2019 SCI V2"],
+            "DE":["machine learning","deep learning",f"topic{i}"],
+            "ID":["artificial intelligence","neural network"],
+            "AB":f"Abstract {i}. Results on ML topic {i}.",
+            "VL":str(10+i),"IS":str(i+1),"BP":str(100+i),"EP":str(110+i)}
+           for i in range(20)]
+
+df = transform(pd.DataFrame(records))
+print(f"✅ DataFrame: {len(df)} rows\n")
+
+ok, fail, skip = [], [], []
+
+def test(name, fn):
+    try:
+        fn()
+        ok.append(name)
+        print(f"✅ {name}")
+    except Exception as e:
+        fail.append((name, str(e)))
+        print(f"❌ {name}: {e}")
+
+# ── functions that only need df ────────────────────────────
+from functions.get_filters import get_filters
+test("get_filters", lambda: get_filters(df))
+
+from functions.get_status import get_status
+test("get_status", lambda: get_status([0, 5, 15, 35, 75, 100]))
+
+from functions.get_bradfordlaw import get_bradford_law
+test("get_bradford_law", lambda: get_bradford_law(df))
+
+from functions.get_thematicmap import get_thematic_map
+test("get_thematic_map", lambda: get_thematic_map(df))
+
+from functions.get_worldmapcollaboration import get_world_map_collaboration
+test("get_world_map_collaboration", lambda: get_world_map_collaboration(df))
+
+# ── functions with simple scalar args ─────────────────────
+from functions.get_relevantauthors import get_relevant_authors
+test("get_relevant_authors", lambda: get_relevant_authors(df, num_of_authors=10))
+
+from functions.get_relevantsources import get_relevant_sources
+test("get_relevant_sources", lambda: get_relevant_sources(df, num_of_sources=10))
+
+from functions.get_authorproductionovertime import get_author_production_over_time
+test("get_author_production_over_time", lambda: get_author_production_over_time(df, top_k_authors=5))
+
+from functions.get_affiliationproductionovertime import get_affiliation_production_over_time
+test("get_affiliation_production_over_time", lambda: get_affiliation_production_over_time(df, top_k_affiliations=5))
+
+from functions.get_localcitedreferences import get_local_cited_refs
+test("get_local_cited_refs", lambda: get_local_cited_refs(df, num_of_cited_refs=10, field_separator=";"))
+
+from functions.get_threefieldplot import get_three_field_plot
+test("get_three_field_plot", lambda: get_three_field_plot(
+    df, left_field="AU", middle_field="DE", right_field="SO",
+    left_field_items=10, middle_field_items=10, right_field_items=10))
+
+from functions.get_frequentwords import get_frequent_words
+test("get_frequent_words", lambda: get_frequent_words(
+    df, ngram=1, num_of_words=20, word_type="DE",
+    file_upload_terms=None, file_upload_synonyms=None))
+
+from functions.get_collaborationnetwork import get_collaboration_network
+test("get_collaboration_network", lambda: get_collaboration_network(
+    df, field="COL_AU", network_layout="fr", clustering_algorithm="louvain",
+    repulsion=100, shape="dot", opacity=0.9, shadow=False, curved=False,
+    colnormalize="association", labelsize=14, edgesize=1,
+    label_cex=True, nodes=50, isolates=False, edges_min=1))
+
+from functions.get_cocitation import get_co_citation
+test("get_co_citation", lambda: get_co_citation(
+    df, field="CR", sep=";", cocit_network_layout="fr",
+    cocit_clustering_algorithm="louvain", cocit_repulsion=100,
+    cocit_shape="dot", cocit_shadow=False, cocit_curved=False,
+    citlabelsize=14, citedgesize=1, citlabel_cex=True,
+    citNodes=50, cit_isolates=False, citedges_min=1))
+
+# ── UI-dependent (skip) ────────────────────────────────────
+for name in ["get_wordcloud", "get_co_occurence_network", "get_thematic_evolution"]:
+    skip.append(name)
+    print(f"⏭️  {name} (Shiny UI args)")
+
+print(f"\n{'='*45}")
+print(f"✅ PASSED : {len(ok)}")
+print(f"❌ FAILED : {len(fail)}")
+print(f"⏭️  SKIPPED: {len(skip)}")
+if fail:
+    print("\nFailed:")
+    for n, e in fail:
+        print(f"  ❌ {n}: {e}")
+print(f"{'='*45}")
diff --git a/test_etl_v4.py b/test_etl_v4.py
new file mode 100644
index 000000000..e07bec134
--- /dev/null
+++ b/test_etl_v4.py
@@ -0,0 +1,188 @@
+"""ETL test v4 - ALL functions"""
+import sys
+sys.path.insert(0, '.')
+import pandas as pd
+import importlib, inspect
+
+from www.services.etl.transformers import transform
+
+records = [{"DB":"OPENALEX","UT":f"W{i}","DI":f"10.1234/{i}","PMID":"",
+            "TI":f"Article about machine learning number {i}",
+            "SO":["Nature","Science","Cell","PNAS","Lancet"][i%5],
+            "JI":"Nat Mach Intell","J9":"NAT MACH INTELL",
+            "PY":str(2018+i%6),"DT":"article","LA":"en","TC":i*5,
+            "AU":[f"Smith{i} J.",f"Doe{i} A."],"AF":[f"Smith{i}, John",f"Doe{i}, Alice"],
+            "C1":[f"University {i}, City, USA",f"Lab {i}, Paris, France"],
+            "RP":f"Smith{i}, John","CR":[f"Ref{i}a 2020 NAT V1",f"Ref{i}b 2019 SCI V2"],
+            "DE":["machine learning","deep learning",f"topic{i}"],
+            "ID":["artificial intelligence","neural network"],
+            "AB":f"Abstract {i}. Results on ML topic {i}.",
+            "VL":str(10+i),"IS":str(i+1),"BP":str(100+i),"EP":str(110+i)}
+           for i in range(30)]
+
+df = transform(pd.DataFrame(records))
+print(f"✅ DataFrame: {len(df)} rows\n")
+
+ok, fail, skip = [], [], []
+
+def test(name, fn):
+    try:
+        fn()
+        ok.append(name)
+        print(f"✅ {name}")
+    except Exception as e:
+        fail.append((name, str(e)[:80]))
+        print(f"❌ {name}: {str(e)[:80]}")
+
+def skip_ui(name):
+    skip.append(name)
+    print(f"⏭️  {name} (Shiny UI args)")
+
+# ── All functions ──────────────────────────────────────────
+from functions.get_filters import get_filters
+test("get_filters", lambda: get_filters(df))
+
+from functions.get_status import get_status
+test("get_status", lambda: get_status([0,5,15,35,75,100]))
+
+from functions.get_bradfordlaw import get_bradford_law
+test("get_bradford_law", lambda: get_bradford_law(df))
+
+from functions.get_thematicmap import get_thematic_map
+test("get_thematic_map", lambda: get_thematic_map(df))
+
+from functions.get_worldmapcollaboration import get_world_map_collaboration
+test("get_world_map_collaboration", lambda: get_world_map_collaboration(df))
+
+from functions.get_relevantauthors import get_relevant_authors
+test("get_relevant_authors", lambda: get_relevant_authors(df, num_of_authors=10))
+
+from functions.get_relevantsources import get_relevant_sources
+test("get_relevant_sources", lambda: get_relevant_sources(df, num_of_sources=10))
+
+from functions.get_authorproductionovertime import get_author_production_over_time
+test("get_author_production_over_time", lambda: get_author_production_over_time(df, top_k_authors=5))
+
+from functions.get_affiliationproductionovertime import get_affiliation_production_over_time
+test("get_affiliation_production_over_time", lambda: get_affiliation_production_over_time(df, top_k_affiliations=5))
+
+from functions.get_localcitedreferences import get_local_cited_refs
+test("get_local_cited_refs", lambda: get_local_cited_refs(df, num_of_cited_refs=10, field_separator=";"))
+
+from functions.get_threefieldplot import get_three_field_plot
+test("get_three_field_plot", lambda: get_three_field_plot(
+    df, left_field="AU", middle_field="DE", right_field="SO",
+    left_field_items=10, middle_field_items=10, right_field_items=10))
+
+from functions.get_frequentwords import get_frequent_words
+test("get_frequent_words", lambda: get_frequent_words(
+    df, ngram=1, num_of_words=20, word_type="DE",
+    file_upload_terms=None, file_upload_synonyms=None))
+
+from functions.get_collaborationnetwork import get_collaboration_network
+test("get_collaboration_network", lambda: get_collaboration_network(
+    df, field="COL_AU", network_layout="fr", clustering_algorithm="louvain",
+    repulsion=100, shape="dot", opacity=0.9, shadow=False, curved=False,
+    colnormalize="association", labelsize=14, edgesize=1,
+    label_cex=True, nodes=50, isolates=False, edges_min=1))
+
+from functions.get_cocitation import get_co_citation
+test("get_co_citation", lambda: get_co_citation(
+    df, field="CR", sep=";", cocit_network_layout="fr",
+    cocit_clustering_algorithm="louvain", cocit_repulsion=100,
+    cocit_shape="dot", cocit_shadow=False, cocit_curved=False,
+    citlabelsize=14, citedgesize=1, citlabel_cex=True,
+    citNodes=50, cit_isolates=False, citedges_min=1))
+
+from functions.get_annualproduction import get_annual_production
+test("get_annual_production", lambda: get_annual_production(df))
+
+from functions.get_averagecitations import get_average_citations
+test("get_average_citations", lambda: get_average_citations(df))
+
+from functions.get_maininformations import get_main_informations
+test("get_main_informations", lambda: get_main_informations(df))
+
+from functions.get_countriesproduction import get_countries_production
+test("get_countries_production", lambda: get_countries_production(df))
+
+from functions.get_countriesproductionovertime import get_countries_production_over_time
+test("get_countries_production_over_time", lambda: get_countries_production_over_time(df))
+
+from functions.get_sourcesproduction import get_sources_production
+test("get_sources_production", lambda: get_sources_production(df))
+
+from functions.get_relevantaffiliations import get_relevant_affiliations
+test("get_relevant_affiliations", lambda: get_relevant_affiliations(df))
+
+from functions.get_lotkalaw import get_lotka_law
+test("get_lotka_law", lambda: get_lotka_law(df))
+
+from functions.get_treemap import get_treemap
+test("get_treemap", lambda: get_treemap(df))
+
+from functions.get_trendtopics import get_trend_topics
+test("get_trend_topics", lambda: get_trend_topics(df))
+
+from functions.get_wordfrequency import get_word_frequency
+test("get_word_frequency", lambda: get_word_frequency(df))
+
+from functions.get_table import get_table
+test("get_table", lambda: get_table(df))
+
+from functions.get_database import get_database
+test("get_database", lambda: get_database(df))
+
+from functions.get_data import get_data
+test("get_data", lambda: get_data(df))
+
+from functions.get_citedcountries import get_cited_countries
+test("get_cited_countries", lambda: get_cited_countries(df))
+
+from functions.get_citeddocuments import get_cited_documents
+test("get_cited_documents", lambda: get_cited_documents(df))
+
+from functions.get_correspondingauthorcountries import get_corresponding_author_countries
+test("get_corresponding_author_countries", lambda: get_corresponding_author_countries(df))
+
+from functions.get_localcitedauthors import get_local_cited_authors
+test("get_local_cited_authors", lambda: get_local_cited_authors(df))
+
+from functions.get_localciteddocuments import get_local_cited_documents
+test("get_local_cited_documents", lambda: get_local_cited_documents(df))
+
+from functions.get_localcitedsources import get_local_cited_sources
+test("get_local_cited_sources", lambda: get_local_cited_sources(df))
+
+from functions.get_sourceslocalimpact import get_sources_local_impact
+test("get_sources_local_impact", lambda: get_sources_local_impact(df))
+
+from functions.get_authorlocalimpact import get_author_local_impact
+test("get_author_local_impact", lambda: get_author_local_impact(df))
+
+from functions.get_historiograph import get_historiograph
+test("get_historiograph", lambda: get_historiograph(df))
+
+from functions.get_referencesspectroscopy import get_references_spectroscopy
+test("get_references_spectroscopy", lambda: get_references_spectroscopy(df))
+
+from functions.get_clusteringcoupling import get_clustering_coupling
+test("get_clustering_coupling", lambda: get_clustering_coupling(df))
+
+from functions.get_factorialanalysis import get_factorial_analysis
+test("get_factorial_analysis", lambda: get_factorial_analysis(df))
+
+# ── UI-dependent ───────────────────────────────────────────
+for name in ["get_wordcloud","get_co_occurence_network","get_thematic_evolution"]:
+    skip_ui(name)
+
+# ── Summary ───────────────────────────────────────────────
+print(f"\n{'='*45}")
+print(f"✅ PASSED : {len(ok)}")
+print(f"❌ FAILED : {len(fail)}")
+print(f"⏭️  SKIPPED: {len(skip)}")
+if fail:
+    print("\nFailed:")
+    for n, e in fail:
+        print(f"  ❌ {n}: {e}")
+print(f"{'='*45}")
diff --git a/test_etl_v5.py b/test_etl_v5.py
new file mode 100644
index 000000000..9cb893d59
--- /dev/null
+++ b/test_etl_v5.py
@@ -0,0 +1,231 @@
+"""ETL test v5 - all functions with correct arguments"""
+import sys, warnings
+sys.path.insert(0, '.')
+warnings.filterwarnings('ignore')
+import pandas as pd
+from www.services.etl.transformers import transform
+import importlib, sys
+
+def fresh_import(module_path, fn_name):
+    """Always reload module to get latest patches"""
+    if module_path in sys.modules:
+        del sys.modules[module_path]
+    mod = __import__(module_path, fromlist=[fn_name])
+    return getattr(mod, fn_name)
+
+records = [{"DB":"OPENALEX","UT":f"W{i}","DI":f"10.1234/{i}","PMID":"",
+            "TI":f"Article about machine learning number {i}",
+            "SO":["Nature","Science","Cell","PNAS","Lancet"][i%5],
+            "JI":"Nat Mach Intell","J9":"NAT MACH INTELL",
+            "PY":str(2018+i%6),"DT":"article","LA":"en","TC":i*5,
+            "AU":[f"Smith{i} J.",f"Doe{i} A."],"AF":[f"Smith{i}, John",f"Doe{i}, Alice"],
+            "C1":[f"University {i}, City, USA",f"Lab {i}, Paris, France"],
+            "RP":f"Smith{i}, John","CR":[f"Ref{i}a 2020 NAT V1",f"Ref{i}b 2019 SCI V2"],
+            "DE":["machine learning","deep learning",f"topic{i}"],
+            "ID":["artificial intelligence","neural network"],
+            "AB":f"Abstract {i}. Results on ML topic {i}.",
+            "VL":str(10+i),"IS":str(i+1),"BP":str(100+i),"EP":str(110+i)}
+           for i in range(30)]
+
+df = transform(pd.DataFrame(records))
+print(f"✅ DataFrame: {len(df)} rows\n")
+
+ok, fail, skip = [], [], []
+
+def test(name, fn):
+    try:
+        fn()
+        ok.append(name)
+        print(f"✅ {name}")
+    except Exception as e:
+        fail.append((name, str(e)[:100]))
+        print(f"❌ {name}: {str(e)[:100]}")
+
+def skip_ui(name):
+    skip.append(name)
+    print(f"⏭️  {name} (UI args)")
+
+# ── Already passing ────────────────────────────────────────
+from functions.get_filters import get_filters
+test("get_filters", lambda: get_filters(df))
+
+from functions.get_status import get_status
+test("get_status", lambda: get_status([0,5,15,35,75,100]))
+
+from functions.get_bradfordlaw import get_bradford_law
+test("get_bradford_law", lambda: get_bradford_law(df))
+
+from functions.get_thematicmap import get_thematic_map
+test("get_thematic_map", lambda: get_thematic_map(df))
+
+from functions.get_worldmapcollaboration import get_world_map_collaboration
+test("get_world_map_collaboration", lambda: get_world_map_collaboration(df))
+
+from functions.get_relevantauthors import get_relevant_authors
+test("get_relevant_authors", lambda: get_relevant_authors(df, num_of_authors=10))
+
+from functions.get_relevantsources import get_relevant_sources
+test("get_relevant_sources", lambda: get_relevant_sources(df, num_of_sources=10))
+
+from functions.get_authorproductionovertime import get_author_production_over_time
+test("get_author_production_over_time", lambda: get_author_production_over_time(df, top_k_authors=5))
+
+from functions.get_affiliationproductionovertime import get_affiliation_production_over_time
+test("get_affiliation_production_over_time", lambda: get_affiliation_production_over_time(df, top_k_affiliations=5))
+
+from functions.get_localcitedreferences import get_local_cited_refs
+test("get_local_cited_refs", lambda: get_local_cited_refs(df, num_of_cited_refs=10, field_separator=";"))
+
+from functions.get_threefieldplot import get_three_field_plot
+test("get_three_field_plot", lambda: get_three_field_plot(
+    df, left_field="AU", middle_field="DE", right_field="SO",
+    left_field_items=10, middle_field_items=10, right_field_items=10))
+
+from functions.get_frequentwords import get_frequent_words
+test("get_frequent_words", lambda: get_frequent_words(
+    df, ngram=1, num_of_words=20, word_type="DE",
+    file_upload_terms=None, file_upload_synonyms=None))
+
+from functions.get_collaborationnetwork import get_collaboration_network
+test("get_collaboration_network", lambda: get_collaboration_network(
+    df, field="COL_AU", network_layout="fr", clustering_algorithm="louvain",
+    repulsion=100, shape="dot", opacity=0.9, shadow=False, curved=False,
+    colnormalize="association", labelsize=14, edgesize=1,
+    label_cex=True, nodes=50, isolates=False, edges_min=1))
+
+from functions.get_cocitation import get_co_citation
+test("get_co_citation", lambda: get_co_citation(
+    df, field="CR", sep=";", cocit_network_layout="fr",
+    cocit_clustering_algorithm="louvain", cocit_repulsion=100,
+    cocit_shape="dot", cocit_shadow=False, cocit_curved=False,
+    citlabelsize=14, citedgesize=1, citlabel_cex=True,
+    citNodes=50, cit_isolates=False, citedges_min=1))
+
+from functions.get_annualproduction import get_annual_production
+test("get_annual_production", lambda: get_annual_production(df))
+
+from functions.get_averagecitations import get_average_citations
+test("get_average_citations", lambda: get_average_citations(df))
+
+from functions.get_maininformations import get_main_informations
+test("get_main_informations", lambda: get_main_informations(df))
+
+from functions.get_countriesproduction import get_countries_production
+test("get_countries_production", lambda: get_countries_production(df))
+
+# ── Now with correct args ──────────────────────────────────
+from functions.get_countriesproductionovertime import get_countries_production_over_time
+test("get_countries_production_over_time", lambda: get_countries_production_over_time(df, top_k_countries=5))
+
+from functions.get_sourcesproduction import get_sources_production
+test("get_sources_production", lambda: get_sources_production(df, num_of_sources_production=10, occurences='Frequency'))
+
+from functions.get_relevantaffiliations import get_relevant_affiliations
+test("get_relevant_affiliations", lambda: get_relevant_affiliations(df, num_of_affiliations=10, disambiguation=False))
+
+from functions.get_treemap import get_treemap
+test("get_treemap", lambda: get_treemap(
+    df, ngram=1, num_of_words=20, word_type="DE",
+    file_upload_terms=None, file_upload_synonyms=None))
+
+from functions.get_trendtopics import get_trend_topics
+test("get_trend_topics", lambda: get_trend_topics(df, ngram=1, field_tt="DE", time_window=3,
+    file_upload_terms_tt=None, file_upload_synonyms_tt=None,
+    word_minimum_frequency=1, number_of_words_year=5))
+
+from functions.get_wordfrequency import get_word_frequency
+test("get_word_frequency", lambda: get_word_frequency(df, ngram=1, field_wf="DE",
+    file_upload_terms_wf=None, file_upload_synonyms_wf=None,
+    occurrences="cumulate", top_words=20))
+
+from functions.get_citedcountries import get_cited_countries
+test("get_cited_countries", lambda: get_cited_countries(df, num_of_cited_countries=10, cited_countries_measure='Frequency'))
+
+from functions.get_citeddocuments import get_cited_documents
+test("get_cited_documents", lambda: get_cited_documents(df, num_of_cited_docs=10, cited_docs_measure='Frequency'))
+
+from functions.get_correspondingauthorcountries import get_corresponding_author_countries
+test("get_corresponding_author_countries", lambda: get_corresponding_author_countries(df, top_k_countries=5))
+
+import importlib, functions.get_localcitedauthors as _lca_mod; importlib.reload(_lca_mod); get_local_cited_authors = fresh_import("functions.get_localcitedauthors", "get_local_cited_authors")
+test("get_local_cited_authors", lambda: get_local_cited_authors(df, num_of_cited_authors=10, fast_search=True))
+
+import functions.get_localciteddocuments as _lcd_mod; importlib.reload(_lcd_mod); get_local_cited_documents = fresh_import("functions.get_localciteddocuments", "get_local_cited_documents")
+test("get_local_cited_documents", lambda: get_local_cited_documents(df, num_of_local_cited_docs=10, field_separator=";", fast_search=True))
+
+from functions.get_localcitedsources import get_local_cited_sources
+test("get_local_cited_sources", lambda: get_local_cited_sources(df, num_of_cited_sources=10))
+
+from functions.get_sourceslocalimpact import get_sources_local_impact
+test("get_sources_local_impact", lambda: get_sources_local_impact(df, num_of_sources_local_impact=10, source_local_impact='Frequency'))
+
+from functions.get_authorlocalimpact import get_author_local_impact
+test("get_author_local_impact", lambda: get_author_local_impact(df))
+
+from functions.get_historiograph import get_historiograph
+test("get_historiograph", lambda: get_historiograph(df))
+
+from functions.get_referencesspectroscopy import get_references_spectroscopy
+test("get_references_spectroscopy", lambda: get_references_spectroscopy(df))
+
+from functions.get_clusteringcoupling import get_clustering_coupling
+test("get_clustering_coupling", lambda: get_clustering_coupling(df))
+
+from functions.get_lotkalaw import get_lotka_law
+test("get_lotka_law", lambda: get_lotka_law(df))
+
+from functions.get_factorialanalysis import get_factorial_analysis
+test("get_factorial_analysis", lambda: get_factorial_analysis(df))
+
+from functions.get_table import get_table
+test("get_table", lambda: get_table(df, df))
+
+from functions.get_data import get_data
+test("get_data", lambda: get_data("OPENALEX", df))
+
+# ── UI-dependent ───────────────────────────────────────────
+for name in ["get_wordcloud","get_co_occurence_network","get_thematic_evolution","get_database"]:
+    skip_ui(name)
+
+print("\n=== Testing remaining functions ===")
+
+from functions.get_authorlocalimpact import get_authors_local_impact
+test("get_authors_local_impact", lambda: get_authors_local_impact(
+    df, num_of_authors_local_impact=10, author_local_impact="LCS"))
+
+from functions.get_clusteringcoupling import get_clustering_coupling
+test("get_clustering_coupling", lambda: get_clustering_coupling(
+    df, unit_of_analysis="documents", coupling_measured="references",
+    stemmer=False, impact_measure="local"))
+
+from functions.get_factorialanalysis import get_factorial_analysis
+test("get_factorial_analysis", lambda: get_factorial_analysis(df))
+
+from functions.get_historiograph import get_historiograph
+test("get_historiograph", lambda: get_historiograph(df))
+
+from functions.get_lotkalaw import get_lotka_law
+test("get_lotka_law", lambda: get_lotka_law(df))
+
+from functions.get_referencesspectroscopy import get_references_spectroscopy
+test("get_references_spectroscopy", lambda: get_references_spectroscopy(
+    df, start_year=2018, end_year=2024, field_separator_spec=";"))
+
+from functions.get_table import get_table
+test("get_table", lambda: get_table("OPENALEX", df))
+
+from functions.get_data import get_data
+test("get_data", lambda: get_data(None, "OPENALEX", df))
+
+# get_database needs Shiny input object
+skip_ui("get_database")
+
+print(f"\n{'='*45}")
+print(f"✅ PASSED : {len(ok)}")
+print(f"❌ FAILED : {len(fail)}")
+print(f"⏭️  SKIPPED: {len(skip)}")
+if fail:
+    print("\nFailed:")
+    for n, e in fail:
+        print(f"  ❌ {n}: {e}")
+print(f"{'='*45}")
diff --git a/test_final.py b/test_final.py
new file mode 100644
index 000000000..43b13640d
--- /dev/null
+++ b/test_final.py
@@ -0,0 +1,188 @@
+"""Final test - ALL 43 functions"""
+import sys, warnings, traceback
+sys.path.insert(0, '.')
+warnings.filterwarnings('ignore')
+# Clear all cached modules
+for key in list(sys.modules.keys()):
+    if 'functions.' in key:
+        del sys.modules[key]
+
+import pandas as pd
+from www.services.etl.transformers import transform
+
+records = [{"DB":"OPENALEX","UT":f"W{i}","DI":f"10.1234/{i}","PMID":"",
+            "TI":f"Article about machine learning {i}",
+            "SO":["Nature","Science","Cell","PNAS","Lancet"][i%5],
+            "JI":"Nat Mach Intell","J9":"NAT MACH INTELL",
+            "PY":str(2018+i%6),"DT":"article","LA":"en","TC":i*5,
+            "AU":[f"Smith{i} J.",f"Doe{i} A."],"AF":[f"Smith{i}, John",f"Doe{i}, Alice"],
+            "C1":[f"University {i}, City, USA",f"Lab {i}, Paris, France"],
+            "RP":f"Smith{i}, John",
+            "CR":[f"Smith{i} J., 2020, NAT V1", f"Doe{i} A., 2019, SCI V2"],
+            "DE":["machine learning","deep learning",f"topic{i}"],
+            "ID":["artificial intelligence","neural network"],
+            "AB":f"Abstract {i}. Results on ML topic {i}.",
+            "VL":str(10+i),"IS":str(i+1),"BP":str(100+i),"EP":str(110+i)}
+           for i in range(30)]
+
+df = transform(pd.DataFrame(records))
+print(f"✅ DataFrame: {len(df)} rows, {len(df.columns)} cols\n")
+
+ok, fail, skip = [], [], []
+
+def test(name, fn):
+    try:
+        fn()
+        ok.append(name)
+        print(f"✅ {name}")
+    except Exception as e:
+        fail.append((name, str(e)[:80]))
+        print(f"❌ {name}: {str(e)[:80]}")
+
+def skip_ui(name):
+    skip.append(name)
+    print(f"⏭️  {name} (UI)")
+
+# All 43 functions
+from functions.get_filters import get_filters
+test("get_filters", lambda: get_filters(df))
+
+from functions.get_status import get_status
+test("get_status", lambda: get_status([0,5,15,35,75,100]))
+
+from functions.get_annualproduction import get_annual_production
+test("get_annual_production", lambda: get_annual_production(df))
+
+from functions.get_averagecitations import get_average_citations
+test("get_average_citations", lambda: get_average_citations(df))
+
+from functions.get_maininformations import get_main_informations
+test("get_main_informations", lambda: get_main_informations(df))
+
+from functions.get_bradfordlaw import get_bradford_law
+test("get_bradford_law", lambda: get_bradford_law(df))
+
+from functions.get_countriesproduction import get_countries_production
+test("get_countries_production", lambda: get_countries_production(df))
+
+from functions.get_countriesproductionovertime import get_countries_production_over_time
+test("get_countries_production_over_time", lambda: get_countries_production_over_time(df, top_k_countries=5))
+
+from functions.get_sourcesproduction import get_sources_production
+test("get_sources_production", lambda: get_sources_production(df, num_of_sources_production=10, occurences='Frequency'))
+
+from functions.get_relevantauthors import get_relevant_authors
+test("get_relevant_authors", lambda: get_relevant_authors(df, num_of_authors=10))
+
+from functions.get_relevantsources import get_relevant_sources
+test("get_relevant_sources", lambda: get_relevant_sources(df, num_of_sources=10))
+
+from functions.get_relevantaffiliations import get_relevant_affiliations
+test("get_relevant_affiliations", lambda: get_relevant_affiliations(df, num_of_affiliations=10, disambiguation=False))
+
+from functions.get_authorproductionovertime import get_author_production_over_time
+test("get_author_production_over_time", lambda: get_author_production_over_time(df, top_k_authors=5))
+
+from functions.get_affiliationproductionovertime import get_affiliation_production_over_time
+test("get_affiliation_production_over_time", lambda: get_affiliation_production_over_time(df, top_k_affiliations=5))
+
+from functions.get_correspondingauthorcountries import get_corresponding_author_countries
+test("get_corresponding_author_countries", lambda: get_corresponding_author_countries(df, top_k_countries=5))
+
+from functions.get_authorlocalimpact import get_authors_local_impact
+test("get_authors_local_impact", lambda: get_authors_local_impact(df, num_of_authors_local_impact=10, author_local_impact="LCS"))
+
+from functions.get_sourceslocalimpact import get_sources_local_impact
+test("get_sources_local_impact", lambda: get_sources_local_impact(df, num_of_sources_local_impact=10, source_local_impact='Frequency'))
+
+from functions.get_citedcountries import get_cited_countries
+test("get_cited_countries", lambda: get_cited_countries(df, num_of_cited_countries=10, cited_countries_measure='Frequency'))
+
+from functions.get_citeddocuments import get_cited_documents
+test("get_cited_documents", lambda: get_cited_documents(df, num_of_cited_docs=10, cited_docs_measure='Frequency'))
+
+from functions.get_localcitedreferences import get_local_cited_refs
+test("get_local_cited_refs", lambda: get_local_cited_refs(df, num_of_cited_refs=10, field_separator=";"))
+
+from functions.get_localcitedauthors import get_local_cited_authors
+test("get_local_cited_authors", lambda: get_local_cited_authors(df, num_of_cited_authors=10, fast_search=True))
+
+from functions.get_localciteddocuments import get_local_cited_documents
+test("get_local_cited_documents", lambda: get_local_cited_documents(df, num_of_local_cited_docs=10, field_separator=";", fast_search=True))
+
+from functions.get_localcitedsources import get_local_cited_sources
+test("get_local_cited_sources", lambda: get_local_cited_sources(df, num_of_cited_sources=10))
+
+from functions.get_frequentwords import get_frequent_words
+test("get_frequent_words", lambda: get_frequent_words(df, ngram=1, num_of_words=20, word_type="DE", file_upload_terms=None, file_upload_synonyms=None))
+
+from functions.get_wordfrequency import get_word_frequency
+test("get_word_frequency", lambda: get_word_frequency(df, ngram=1, field_wf="DE", file_upload_terms_wf=None, file_upload_synonyms_wf=None, occurrences="cumulate", top_words=20))
+
+from functions.get_treemap import get_treemap
+test("get_treemap", lambda: get_treemap(df, ngram=1, num_of_words=20, word_type="DE", file_upload_terms=None, file_upload_synonyms=None))
+
+from functions.get_trendtopics import get_trend_topics
+test("get_trend_topics", lambda: get_trend_topics(df, ngram=1, field_tt="DE", time_window=3, file_upload_terms_tt=None, file_upload_synonyms_tt=None, word_minimum_frequency=1, number_of_words_year=5))
+
+from functions.get_threefieldplot import get_three_field_plot
+test("get_three_field_plot", lambda: get_three_field_plot(df, left_field="AU", middle_field="DE", right_field="SO", left_field_items=10, middle_field_items=10, right_field_items=10))
+
+from functions.get_thematicmap import get_thematic_map
+test("get_thematic_map", lambda: get_thematic_map(df))
+
+from functions.get_worldmapcollaboration import get_world_map_collaboration
+test("get_world_map_collaboration", lambda: get_world_map_collaboration(df))
+
+from functions.get_collaborationnetwork import get_collaboration_network
+test("get_collaboration_network", lambda: get_collaboration_network(
+    df, field="COL_AU", network_layout="fr", clustering_algorithm="louvain",
+    repulsion=100, shape="dot", opacity=0.9, shadow=False, curved=False,
+    colnormalize="association", labelsize=14, edgesize=1,
+    label_cex=True, nodes=50, isolates=False, edges_min=1))
+
+from functions.get_cocitation import get_co_citation
+test("get_co_citation", lambda: get_co_citation(
+    df, field="CR", sep=";", cocit_network_layout="fr",
+    cocit_clustering_algorithm="louvain", cocit_repulsion=100,
+    cocit_shape="dot", cocit_shadow=False, cocit_curved=False,
+    citlabelsize=14, citedgesize=1, citlabel_cex=True,
+    citNodes=50, cit_isolates=False, citedges_min=1))
+
+from functions.get_clusteringcoupling import get_clustering_coupling
+test("get_clustering_coupling", lambda: get_clustering_coupling(
+    df, unit_of_analysis="documents", coupling_measured="references",
+    stemmer=False, impact_measure="local"))
+
+from functions.get_lotkalaw import get_lotka_law
+test("get_lotka_law", lambda: get_lotka_law(df))
+
+from functions.get_historiograph import get_historiograph
+test("get_historiograph", lambda: get_historiograph(df))
+
+from functions.get_referencesspectroscopy import get_references_spectroscopy
+test("get_references_spectroscopy", lambda: get_references_spectroscopy(
+    df, start_year=2018, end_year=2024, field_separator_spec=";"))
+
+from functions.get_factorialanalysis import get_factorial_analysis
+test("get_factorial_analysis", lambda: get_factorial_analysis(df))
+
+from functions.get_table import get_table
+test("get_table", lambda: get_table("OPENALEX", df))
+
+from functions.get_data import get_data
+test("get_data", lambda: get_data(None, "OPENALEX", df))
+
+# UI-dependent
+for name in ["get_wordcloud", "get_co_occurence_network", "get_thematic_evolution", "get_database"]:
+    skip_ui(name)
+
+print(f"\n{'='*45}")
+print(f"✅ PASSED : {len(ok)} / {len(ok)+len(fail)}")
+print(f"❌ FAILED : {len(fail)}")
+print(f"⏭️  SKIPPED: {len(skip)} (UI)")
+if fail:
+    print("\nFailed:")
+    for n, e in fail:
+        print(f"  ❌ {n}: {e}")
+print(f"{'='*45}")
diff --git a/test_functions.py b/test_functions.py
new file mode 100644
index 000000000..19826b3fb
--- /dev/null
+++ b/test_functions.py
@@ -0,0 +1,112 @@
+import sys
+import importlib
+sys.path.insert(0, "www")
+sys.path.insert(0, "functions")
+
+import importlib.util
+spec = importlib.util.spec_from_file_location("standardizer", "www/services/standardizer.py")
+_mod = importlib.util.module_from_spec(spec)
+spec.loader.exec_module(_mod)
+convert2df = _mod.convert2df
+
+print("Fetching OpenAlex data...")
+df = convert2df("machine learning", source="openalex", max_results=50, verbose=False)
+print(f"OpenAlex DataFrame ready: {len(df)} records\n")
+
+print("Fetching PubMed data...")
+df_pubmed = convert2df("machine learning", source="pubmed", max_results=50, verbose=False)
+print(f"PubMed DataFrame ready: {len(df_pubmed)} records\n")
+
+functions = [
+    ("get_affiliationproductionovertime", "get_affiliation_production_over_time", {"top_k_affiliations": 10}, df),
+    ("get_annualproduction",              "get_annual_production",                 {}, df),
+    ("get_authorlocalimpact",             "get_authors_local_impact",              {"num_of_authors_local_impact": 10, "author_local_impact": "h_index"}, df),
+    ("get_authorproductionovertime",      "get_author_production_over_time",       {"top_k_authors": 10}, df),
+    ("get_averagecitations",              "get_average_citations",                 {}, df),
+    ("get_bradfordlaw",                   "get_bradford_law",                      {}, df),
+    ("get_citedcountries",               "get_cited_countries",                   {"num_of_cited_countries": 10, "cited_countries_measure": "frequency"}, df),
+    ("get_citeddocuments",               "get_cited_documents",                   {"num_of_cited_docs": 10, "cited_docs_measure": "frequency"}, df),
+    ("get_countriesproduction",          "get_countries_production",              {}, df),
+    ("get_countriesproductionovertime",  "get_countries_production_over_time",    {"top_k_countries": 10}, df),
+    ("get_correspondingauthorcountries", "get_corresponding_author_countries",    {"top_k_countries": 10}, df),
+    ("get_frequentwords",                "get_frequent_words",                    {"ngram": 1, "num_of_words": 20, "word_type": "DE", "file_upload_terms": None, "file_upload_synonyms": None}, df),
+    ("get_historiograph",                "get_historiograph",                     {}, df_pubmed),
+    ("get_localcitedauthors",            "get_local_cited_authors",               {"num_of_cited_authors": 10}, df_pubmed),
+    ("get_localciteddocuments",          "get_local_cited_documents",             {"num_of_local_cited_docs": 10, "field_separator": ";"}, df_pubmed),
+    ("get_localcitedreferences",         "get_local_cited_refs",                  {"num_of_cited_refs": 10, "field_separator": ";"}, df_pubmed),
+    ("get_localcitedsources",            "get_local_cited_sources",               {"num_of_cited_sources": 10}, df_pubmed),
+    ("get_lotkalaw",                     "get_lotka_law",                         {}, df),
+    ("get_maininformations",             "get_main_informations",                 {}, df),
+    ("get_referencesspectroscopy",       "get_references_spectroscopy",           {"start_year": 2000}, df_pubmed),
+    ("get_relevantaffiliations",         "get_relevant_affiliations",             {"num_of_affiliations": 10, "disambiguation": False}, df),
+    ("get_relevantauthors",              "get_relevant_authors",                  {"num_of_authors": 10}, df),
+    ("get_relevantsources",              "get_relevant_sources",                  {"num_of_sources": 10}, df),
+    ("get_sourceslocalimpact",           "get_sources_local_impact",              {"num_of_sources_local_impact": 10, "source_local_impact": "h_index"}, df),
+    ("get_sourcesproduction",            "get_sources_production",                {"num_of_sources_production": 10, "occurences": "frequency"}, df),
+    ("get_thematicmap",                  "get_thematic_map",                      {}, df),
+    ("get_thematicevolution",            "get_thematic_evolution",                {"years": [2020, 2023]}, df),
+    ("get_threefieldplot",               "get_three_field_plot",                  {"left_field": "AU", "middle_field": "DE", "right_field": "SO", "left_field_items": 10, "middle_field_items": 10, "right_field_items": 10}, df),
+    ("get_treemap",                      "get_treemap",                           {"ngram": 1, "num_of_words": 20, "word_type": "DE", "file_upload_terms": None, "file_upload_synonyms": None}, df),
+    ("get_trendtopics",                  "get_trend_topics",                      {"ngram": 1, "field_tt": "DE", "time_window": [2015, 2025], "file_upload_terms_tt": None, "file_upload_synonyms_tt": None, "word_minimum_frequency": 1, "number_of_words_year": 3}, df),
+    ("get_wordcloud",                    "get_wordcloud",                         {"ngram": 1, "num_of_words_wc": 50, "field_wc": "DE", "file_upload_terms_wc": None, "file_upload_synonyms_wc": None}, df),
+    ("get_wordfrequency",                "get_word_frequency",                    {"ngram": 1, "field_wf": "DE", "file_upload_terms_wf": None, "file_upload_synonyms_wf": None, "occurrences": "frequency", "top_words": [20, 20]}, df),
+    ("get_worldmapcollaboration",        "get_world_map_collaboration",           {}, df),
+    ("get_filters",                      "get_filters",                           {}, df),
+    ("get_factorialanalysis",            "get_factorial_analysis",                {"field": "DE", "ngram": 1}, df),
+    ("get_clusteringcoupling",           "get_clustering_coupling",               {
+        "unit_of_analysis": "sources", "coupling_measured": "keywords",
+        "stemmer": False, "impact_measure": "h_index", "cluster_labeling": "freq",
+        "ngram": 1, "num_of_units": 10, "min_cluster_freq": 2,
+        "label_per_cluster": 3, "label_size": 10, "community_repulsion": 0.1,
+        "clustering_algorithm": "walktrap"
+    }, df),
+    ("get_co_occurence_network",         "get_co_occurence_network",              {
+        "field_cn": "DE", "ngram": 1, "network_layout": "fr",
+        "clustering_algorithm_cn": "walktrap", "normalization_cn": "association",
+        "color_by_year": False, "num_of_nodes": 50, "repulsion_force": 0.1,
+        "remove_isolated": True, "min_edges": 1, "node_opacity": 0.8,
+        "num_of_labels": 10, "node_shape": "dot", "label_size_ls": 10,
+        "edge_size": 1, "node_shadow": False, "edit_nodes": False,
+        "label_cex": 1, "file_upload_terms": None, "file_upload_synonyms": None
+    }, df),
+    ("get_cocitation",                   "get_co_citation",                       {
+        "field": "CR", "sep": ";", "cocit_network_layout": "fr",
+        "cocit_clustering_algorithm": "walktrap", "cocit_repulsion": 0.1,
+        "cocit_shape": "dot", "cocit_shadow": False, "cocit_curved": False,
+        "citlabelsize": 10, "citedgesize": 1, "citlabel_cex": 1,
+        "citNodes": 50, "cit_isolates": True, "citedges_min": 1
+    }, df_pubmed),
+    ("get_collaborationnetwork",         "get_collaboration_network",             {
+        "field": "COL_AU", "network_layout": "fr", "clustering_algorithm": "walktrap",
+        "repulsion": 0.1, "shape": "dot", "opacity": 0.8, "shadow": False,
+        "curved": False, "colnormalize": "association", "labelsize": 10,
+        "edgesize": 1, "label_cex": 1, "nodes": 50, "isolates": True, "edges_min": 1
+    }, df),
+]
+
+passed = []
+failed = []
+
+for module_name, func_name, kwargs, data in functions:
+    try:
+        mod = importlib.import_module(module_name)
+        func = getattr(mod, func_name, None)
+        if func is None:
+            failed.append((func_name, "function not found in module"))
+            print(f"  FAIL  {func_name}: function not found")
+            continue
+        func(data, **kwargs)
+        passed.append(func_name)
+        print(f"  PASS  {func_name}")
+    except Exception as e:
+        failed.append((func_name, str(e)))
+        print(f"  FAIL  {func_name}: {e}")
+
+print(f"\n{'='*50}")
+print(f"TOTAL PASSED: {len(passed)}/{len(functions)}")
+print(f"TOTAL FAILED: {len(failed)}/{len(functions)}")
+if failed:
+    print("\nFailed functions:")
+    for fn, err in failed:
+        print(f"  - {fn}: {err}")
+print(f"{'='*50}")
diff --git a/test_functions_dir.py b/test_functions_dir.py
new file mode 100644
index 000000000..99dd4bb19
--- /dev/null
+++ b/test_functions_dir.py
@@ -0,0 +1,75 @@
+import os, sys, traceback, importlib.util
+sys.path.insert(0, '.')
+sys.path.insert(0, './www')
+
+from www.services.etl.loader import load_standardized_csv
+df = load_standardized_csv('standardized_output.csv')
+print(f"Loaded {len(df)} records\n")
+
+# اسم فایل → اسم فانکشن اصلی
+FUNC_MAP = {
+    "get_affiliationproductionovertime": ("get_affiliation_production_over_time", [df, 5]),
+    "get_annualproduction":              ("get_annual_production", [df]),
+    "get_authorlocalimpact":             ("get_authors_local_impact", [df, 10, "h_index"]),
+    "get_authorproductionovertime":      ("get_author_production_over_time", [df, 5]),
+    "get_averagecitations":              ("get_average_citations", [df]),
+    "get_bradfordlaw":                   ("get_bradford_law", [df]),
+    "get_citedcountries":                ("get_cited_countries", [df, 10, "n"]),
+    "get_citeddocuments":                ("get_cited_documents", [df, 10, "n"]),
+    "get_correspondingauthorcountries":  ("get_corresponding_author_countries", [df, 10]),
+    "get_countriesproduction":           ("get_countries_production", [df]),
+    "get_countriesproductionovertime":   ("get_countries_production_over_time", [df, 5]),
+    "get_filters":                       ("get_filters", [df]),
+    "get_frequentwords":                 ("get_frequent_words", [df, 1, 20, "DE", None, None]),
+    "get_historiograph":                 ("get_historiograph", [df]),
+    "get_localcitedauthors":             ("get_local_cited_authors", [df, 10]),
+    "get_localciteddocuments":           ("get_local_cited_documents", [df, 10, ";"]),
+    "get_localcitedreferences":          ("get_local_cited_refs", [df, 10, ";"]),
+    "get_localcitedsources":             ("get_local_cited_sources", [df, 10]),
+    "get_lotkalaw":                      ("get_lotka_law", [df]),
+    "get_maininformations":              ("get_main_informations", [df]),
+    "get_referencesspectroscopy":        ("get_references_spectroscopy", [df, 2000]),
+    "get_relevantaffiliations":          ("get_relevant_affiliations", [df, 10, False]),
+    "get_relevantauthors":               ("get_relevant_authors", [df, 10]),
+    "get_relevantsources":               ("get_relevant_sources", [df, 10]),
+    "get_sourceslocalimpact":            ("get_sources_local_impact", [df, 10, "h_index"]),
+    "get_sourcesproduction":             ("get_sources_production", [df, 10, "n"]),
+    "get_thematicmap":                   ("get_thematic_map", [df]),
+    "get_thematicevolution":             ("get_thematic_evolution", [df, "ID", [2021, 2023, 2025]]),
+    "get_threefieldplot":                ("get_three_field_plot", [df, "AU", "DE", "SO", 10, 10, 10]),
+    "get_treemap":                       ("get_treemap", [df, 1, 20, "DE", None, None]),
+    "get_trendtopics":                   ("get_trend_topics", [df, 1, "DE", 3, None, None, 2, 5]),
+    "get_wordcloud":                     ("get_wordcloud", [df, 1, 50, "DE", None, None]),
+    "get_wordfrequency":                 ("get_word_frequency", [df, 1, "DE", None, None, "n", 20]),
+    "get_worldmapcollaboration":         ("get_world_map_collaboration", [df]),
+}
+
+passed, failed, warned = [], [], []
+
+for fname, (func_name, args) in FUNC_MAP.items():
+    fpath = f"./functions/{fname}.py"
+    if not os.path.exists(fpath):
+        print(f"⚠️  {fname}: file not found")
+        warned.append(fname)
+        continue
+    try:
+        spec = importlib.util.spec_from_file_location(fname, fpath)
+        mod = importlib.util.module_from_spec(spec)
+        spec.loader.exec_module(mod)
+        func = getattr(mod, func_name, None)
+        if func is None:
+            print(f"⚠️  {fname}: function '{func_name}' not found")
+            warned.append(fname)
+            continue
+        func(*args)
+        print(f"✅ {func_name}")
+        passed.append(fname)
+    except Exception as e:
+        print(f"❌ {func_name}: {type(e).__name__}: {e}")
+        failed.append((fname, e))
+
+print(f"\n{'='*50}")
+print(f"✅ Passed : {len(passed)}")
+print(f"❌ Failed : {len(failed)}")
+print(f"⚠️  Warned : {len(warned)}")
+print(f"{'='*50}")
diff --git a/test_openalex_output.csv b/test_openalex_output.csv
new file mode 100644
index 000000000..fe5ccd86e
--- /dev/null
+++ b/test_openalex_output.csv
@@ -0,0 +1,101 @@
+DB,UT,DI,PMID,TI,SO,JI,J9,PY,DT,LA,TC,AU,AF,C1,RP,CR,DE,ID,AB,VL,IS,BP,EP,SR,AU_UN,AU1_CO,C3
+OPENALEX,https://openalex.org/W2101234009,10.48550/arxiv.1201.0490,,Scikit-learn: Machine Learning in Python,arXiv (Cornell University),,,2012,preprint,en,63665,"['Pedregosa F.', 'Varoquaux G.', 'Gramfort A.', 'Michel V.', 'Thirion B.', 'Grisel O.', 'Blondel M.', 'Andreas M.', 'Joel N.', 'Gilles L.', 'Prettenhofer P.', 'Weiss R.', 'Dubourg V.', 'Vanderplas J.', 'Passos A.', 'Cournapeau D.', 'Brucher M.', 'Perrot M.', 'Duchesnay É.']","['Fabián Pedregosa', 'Gaël Varoquaux', 'Alexandre Gramfort', 'Vincent Michel', 'Bertrand Thirion', 'Olivier Grisel', 'Mathieu Blondel', 'Müller, Andreas', 'Nothman, Joel', 'Louppe, Gilles', 'Peter Prettenhofer', 'Ron J. Weiss', 'Vincent Dubourg', 'Jake Vanderplas', 'Alexandre Passos', 'David Cournapeau', 'Matthieu Brucher', 'Matthieu Perrot', 'Édouard Duchesnay']","[""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'CEA Paris-Saclay', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'CEA Paris-Saclay', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'CEA Paris-Saclay', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'CEA Paris-Saclay', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'CEA Paris-Saclay', 'Nuxe (France)', 'Kobe University', 'Bauhaus-Universität Weimar', 'Google (Canada)', 'University of Washington', 'Amherst College', 'University of Massachusetts Amherst', 'Enthought (United States)', 'Total (France)']",,[],"['Python (programming language)', 'Documentation', 'Computer science', 'MIT License', 'Artificial intelligence', 'Machine learning', 'Programming language', 'License', 'Software engineering', 'Operating system']","['Python (programming language)', 'Documentation', 'Computer science', 'MIT License', 'Artificial intelligence', 'Machine learning', 'Programming language', 'License', 'Software engineering', 'Operating system']",,,,,,Pedregosa 2012 arXiv VV0,Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Nuxe (France);Kobe University;Bauhaus-Universität Weimar;Google (Canada);University of Washington;Amherst College;University of Massachusetts Amherst;Enthought (United States);Total (France),Commissariat à l'Énergie Atomique et aux Énergies Alternatives,Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;CEA Paris-Saclay;Nuxe (France);Kobe University;Bauhaus-Universität Weimar;Google (Canada);University of Washington;Amherst College;University of Massachusetts Amherst;Enthought (United States);Total (France)
+OPENALEX,https://openalex.org/W3023540311,10.5860/choice.27-0936,,"Genetic algorithms in search, optimization, and machine learning",Choice Reviews Online,,,1989,article,en,49332,[],[],[],,[],"['Computer science', 'Artificial intelligence', 'Machine learning', 'Quality control and genetic algorithms', 'Algorithm', 'Genetic algorithm', 'Meta-optimization']","['Computer science', 'Artificial intelligence', 'Machine learning', 'Quality control and genetic algorithms', 'Algorithm', 'Genetic algorithm', 'Meta-optimization']",,27,02,27,0936,UNKNOWN 1989 Choice V27,,,
+OPENALEX,https://openalex.org/W2125055259,,,C4.5: Programs for Machine Learning,,,,1992,book,en,23696,['Quinlan J.'],['J. R. Quinlan'],['University of Sydney'],,[],"['Computer science', 'Unix', 'Classifier (UML)', 'Machine learning', 'Artificial intelligence', 'Source code', 'Workstation', 'Software', 'Decision tree', 'Sample (material)', 'Software engineering', 'Data mining', 'Programming language', 'Operating system']","['Computer science', 'Unix', 'Classifier (UML)', 'Machine learning', 'Artificial intelligence', 'Source code', 'Workstation', 'Software', 'Decision tree', 'Sample (material)', 'Software engineering', 'Data mining', 'Programming language', 'Operating system', 'Chromatography', 'Chemistry']",,,,,,Quinlan 1992 UNKNOWNJ VV0,University of Sydney,University of Sydney,University of Sydney
+OPENALEX,https://openalex.org/W1570448133,10.1016/c2009-0-19715-5,,Data Mining: Practical Machine Learning Tools and Techniques,Elsevier eBooks,,,2011,book,en,25711,"['Witten I.', 'Frank E.', 'Hall M.']","['Ian H. Witten', 'Eibe Frank', 'Mark A. Hall']",[],,[],"['Computer science', 'Machine learning', 'Data science', 'Data mining', 'Artificial intelligence']","['Computer science', 'Machine learning', 'Data science', 'Data mining', 'Artificial intelligence']",,,,,,Witten 2011 Elsevier VV0,,,
+OPENALEX,https://openalex.org/W3120740533,,,UCI Machine Learning Repository,Medical Entomology and Zoology,,,2007,article,en,24320,['Asuncion A.'],['Arthur Asuncion'],[],,[],"['Computer science', 'Artificial intelligence']","['Computer science', 'Artificial intelligence']",,,,,,Asuncion 2007 Medical VV0,,,
+OPENALEX,https://openalex.org/W1663973292,10.1117/1.2819119,,Pattern Recognition and Machine Learning,Journal of Electronic Imaging,,,2007,article,en,22082,['Nasrabadi N.'],['Nasser M. Nasrabadi'],"['West Virginia University', 'Microsoft Research (United Kingdom)']",,[],"['Computer science', 'Imaging science', 'Cover (algebra)', 'Data science', 'Artificial intelligence', 'Engineering']","['Computer science', 'Imaging science', 'Cover (algebra)', 'Data science', 'Artificial intelligence', 'Engineering', 'Mechanical engineering']",,16,4,049901,049901,Nasrabadi 2007 Journal V16,West Virginia University;Microsoft Research (United Kingdom),West Virginia University,West Virginia University;Microsoft Research (United Kingdom)
+OPENALEX,https://openalex.org/W1639032689,,,"Genetic Algorithms in Search, Optimization and Machine Learning",,,,1988,book,en,17771,['Goldberg D.'],['David E. Goldberg'],[],,[],"['Pascal (unit)', 'Computer science', 'Genetic programming', 'Genetic algorithm', 'Machine learning', 'Artificial intelligence', 'Quality control and genetic algorithms', 'Theoretical computer science', 'Algorithm', 'Programming language', 'Meta-optimization']","['Pascal (unit)', 'Computer science', 'Genetic programming', 'Genetic algorithm', 'Machine learning', 'Artificial intelligence', 'Quality control and genetic algorithms', 'Theoretical computer science', 'Algorithm', 'Programming language', 'Meta-optimization']",,,,,,Goldberg 1988 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W1583837637,10.1145/1273496,,Proceedings of the 24th international conference on Machine learning,,,,2007,preprint,en,11733,[],[],[],,[],"['Presentation (obstetrics)', 'Library science', 'Computer science', 'Medical education', 'Medicine']","['Presentation (obstetrics)', 'Library science', 'Computer science', 'Medical education', 'Medicine', 'Radiology']",,,,,,UNKNOWN 2007 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W1503398984,,,Machine learning a probabilistic perspective,,,,2012,book,en,9327,['Murphy K.'],['Kevin P. Murphy'],[],,[],"['Computer science', 'Probabilistic logic', 'Artificial intelligence', 'Field (mathematics)', 'Conditional random field', 'Heuristic', 'Machine learning', 'Graphical model', 'Regularization (linguistics)', 'Software', 'Programming language']","['Computer science', 'Probabilistic logic', 'Artificial intelligence', 'Field (mathematics)', 'Conditional random field', 'Heuristic', 'Machine learning', 'Graphical model', 'Regularization (linguistics)', 'Software', 'Programming language', 'Pure mathematics', 'Mathematics']",,,,,,Murphy 2012 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W1901616594,10.1126/science.aaa8415,26185243,"Machine learning: Trends, perspectives, and prospects",Science,,,2015,review,en,9497,"['Jordan M.', 'Mitchell T.']","['Michael I. Jordan', 'Tom M. Mitchell']","['University of California, Berkeley', 'Carnegie Mellon University']",,[],"['Intersection (aeronautics)', 'Computer science', 'Artificial intelligence', 'Core (optical fiber)', 'Data science', 'Machine learning', 'Big data', 'Computation', 'Lying', 'Engineering', 'Data mining']","['Intersection (aeronautics)', 'Computer science', 'Artificial intelligence', 'Core (optical fiber)', 'Data science', 'Machine learning', 'Big data', 'Computation', 'Lying', 'Engineering', 'Data mining', 'Aerospace engineering', 'Radiology', 'Telecommunications', 'Medicine', 'Algorithm']",,349,6245,255,260,Jordan 2015 Science V349,"University of California, Berkeley;Carnegie Mellon University",Berkeley,"University of California, Berkeley;Carnegie Mellon University"
+OPENALEX,https://openalex.org/W1746819321,10.7551/mitpress/3206.001.0001,,Gaussian Processes for Machine Learning,The MIT Press eBooks,,,2005,book,en,10487,"['Rasmussen C.', 'Williams C.']","['Carl Edward Rasmussen', 'Christopher K. I. Williams']","['Max Planck Institute for Biological Cybernetics', 'Max Planck Society']",,[],"['Machine learning', 'Artificial intelligence', 'Computer science', 'Online machine learning', 'Gaussian process', 'Probabilistic logic', 'Relevance vector machine', 'Support vector machine', 'Kernel method', 'Artificial neural network', 'Gaussian']","['Machine learning', 'Artificial intelligence', 'Computer science', 'Online machine learning', 'Gaussian process', 'Probabilistic logic', 'Relevance vector machine', 'Support vector machine', 'Kernel method', 'Artificial neural network', 'Gaussian', 'Quantum mechanics', 'Physics']",,,,,,Rasmussen 2005 The VV0,Max Planck Institute for Biological Cybernetics;Max Planck Society,Max Planck Institute for Biological Cybernetics,Max Planck Institute for Biological Cybernetics;Max Planck Society
+OPENALEX,https://openalex.org/W2997591727,10.5555/1953048.2078195,,Scikit-learn: Machine Learning in Python,Journal of Machine Learning Research,,,2011,article,en,8193,"['PedregosaFabian', 'VaroquauxGaël', 'GramfortAlexandre', 'MichelVincent', 'ThirionBertrand', 'GriselOlivier', 'BlondelMathieu', 'PrettenhoferPeter', 'WeissRon', 'DubourgVincent', 'VanderplasJake', 'PassosAlexandre', 'CournapeauDavid', 'BrucherMatthieu', 'PerrotMatthieu', 'DuchesnayÉdouard']","['PedregosaFabian', 'VaroquauxGaël', 'GramfortAlexandre', 'MichelVincent', 'ThirionBertrand', 'GriselOlivier', 'BlondelMathieu', 'PrettenhoferPeter', 'WeissRon', 'DubourgVincent', 'VanderplasJake', 'PassosAlexandre', 'CournapeauDavid', 'BrucherMatthieu', 'PerrotMatthieu', 'DuchesnayÉdouard']",[],,[],"['Python (programming language)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Programming language']","['Python (programming language)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Programming language']",,,,,,PedregosaFabian 2011 Journal VV0,,,
+OPENALEX,https://openalex.org/W4212863985,10.1007/978-0-387-45528-0,,Pattern Recognition and Machine Learning,,,,2006,book,en,9852,[],[],[],,[],"['Computer science', 'Artificial intelligence', 'Pattern recognition (psychology)']","['Computer science', 'Artificial intelligence', 'Pattern recognition (psychology)']",,,,,,UNKNOWN 2006 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W2953384591,10.48550/arxiv.1605.08695,,TensorFlow: A system for large-scale machine learning,arXiv (Cornell University),,,2016,preprint,en,8815,"['Abadi M.', 'Barham P.', 'Chen J.', 'Chen Z.', 'Davis A.', 'Dean J.', 'Devin M.', 'Ghemawat S.', 'Irving G.', 'Isard M.', 'Kudlur M.', 'Levenberg J.', 'Monga R.', 'Moore S.', 'Murray D.', 'Steiner B.', 'Tucker P.', 'Vasudevan V.', 'Warden P.', 'Wicke M.', 'Yu Y.', 'Zheng X.']","['Martı́n Abadi', 'Paul Barham', 'Jianmin Chen', 'Zhifeng Chen', 'Andy Davis', 'Jay B. Dean', 'Matthieu Devin', 'Sanjay Ghemawat', 'Geoffrey Irving', 'Michael Isard', 'Manjunath Kudlur', 'Josh Levenberg', 'Rajat Monga', 'Sherry Moore', 'Derek G. Murray', 'Benoit Steiner', 'Paul A. Tucker', 'Vijay Vasudevan', 'Pete Warden', 'Martin Wicke', 'Yuan Yu', 'Xiaoqiang Zheng']","['Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)']",,[],"['Scale (ratio)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Cartography', 'Geography']","['Scale (ratio)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Cartography', 'Geography']",,,,,,Abadi 2016 arXiv VV0,Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States),Google (United States),Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States)
+OPENALEX,https://openalex.org/W2084812512,,,UCI Repository of machine learning databases,Medical Entomology and Zoology,,,1998,article,en,10547,['Blake C.'],['Catherine Blake'],[],,[],"['Computer science', 'Database', 'Artificial intelligence']","['Computer science', 'Database', 'Artificial intelligence']",,,,,,Blake 1998 Medical VV0,,,
+OPENALEX,https://openalex.org/W2118020653,10.1145/505282.505283,,Machine learning in automated text categorization,ACM Computing Surveys,,,2002,review,en,7884,['Sebastiani F.'],['Fabrizio Sebastiani'],['Consorzio Pisa Ricerche'],,[],"['Computer science', 'Categorization', 'Software portability', 'Artificial intelligence', 'Classifier (UML)', 'Machine learning', 'Text categorization', 'Natural language processing']","['Computer science', 'Categorization', 'Software portability', 'Artificial intelligence', 'Classifier (UML)', 'Machine learning', 'Text categorization', 'Natural language processing', 'Programming language']",,34,1,1,47,Sebastiani 2002 ACM V34,Consorzio Pisa Ricerche,Consorzio Pisa Ricerche,Consorzio Pisa Ricerche
+OPENALEX,https://openalex.org/W1504694836,,,Programs for Machine Learning,,,,1994,article,en,5804,"['Salzberg S.', 'Segre A.']","['Steven L. Salzberg', 'Alberto M. Segre']",['Johns Hopkins University'],,[],"['Successor cardinal', 'Artificial intelligence', 'Computer science', 'Decision tree', 'Machine learning', 'Subject (documents)', 'ID3 algorithm', 'Decision tree learning', 'Incremental decision tree', 'World Wide Web', 'Mathematics']","['Successor cardinal', 'Artificial intelligence', 'Computer science', 'Decision tree', 'Machine learning', 'Subject (documents)', 'ID3 algorithm', 'Decision tree learning', 'Incremental decision tree', 'World Wide Web', 'Mathematics', 'Mathematical analysis']",,,,,,Salzberg 1994 UNKNOWNJ VV0,Johns Hopkins University,Johns Hopkins University,Johns Hopkins University
+OPENALEX,https://openalex.org/W2271840356,10.48550/arxiv.1603.04467,,TensorFlow: Large-Scale Machine Learning on Heterogeneous Distributed Systems,arXiv (Cornell University),,,2016,preprint,en,9772,"['Abadi M.', 'Agarwal A.', 'Barham P.', 'Brevdo E.', 'Chen Z.', 'Citro C.', 'Corrado G.', 'Davis A.', 'Dean J.', 'Devin M.', 'Ghemawat S.', 'Goodfellow I.', 'Harp A.', 'Irving G.', 'Isard M.', 'Jia Y.', 'Józefowicz R.', 'Kaiser Ł.', 'Kudlur M.', 'Levenberg J.', 'Mané D.', 'Monga R.', 'Moore S.', 'Murray D.', 'Olah C.', 'Schuster M.', 'Shlens J.', 'Steiner B.', 'Sutskever I.', 'Talwar K.', 'Tucker P.', 'Vanhoucke V.', 'Vasudevan V.', 'Viégas F.', 'Vinyals O.', 'Warden P.', 'Wattenberg M.', 'Wicke M.', 'Yu Y.', 'Zheng X.']","['Martı́n Abadi', 'Ashish Agarwal', 'Paul Barham', 'Eugene Brevdo', 'Zhifeng Chen', 'Craig Citro', 'Gregory S. Corrado', 'Andy Davis', 'Jay B. Dean', 'Matthieu Devin', 'Sanjay Ghemawat', 'Ian Goodfellow', 'Andrew Harp', 'Geoffrey Irving', 'Michael Isard', 'Yangqing Jia', 'Rafał Józefowicz', 'Łukasz Kaiser', 'Manjunath Kudlur', 'Josh Levenberg', 'Dan Mané', 'Rajat Monga', 'Sherry Moore', 'Derek G. Murray', 'Chris Olah', 'Mike Schuster', 'Jonathon Shlens', 'Benoit Steiner', 'Ilya Sutskever', 'Kunal Talwar', 'Paul A. Tucker', 'Vincent Vanhoucke', 'Vijay Vasudevan', 'Fernanda Viégas', 'Oriol Vinyals', 'Pete Warden', 'Martin Wattenberg', 'Martin Wicke', 'Yuan Yu', 'Xiaoqiang Zheng']",[],,[],"['Scale (ratio)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Distributed computing', 'Geography', 'Cartography']","['Scale (ratio)', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Distributed computing', 'Geography', 'Cartography']",,,,,,Abadi 2016 arXiv VV0,,,
+OPENALEX,https://openalex.org/W3163993681,10.1038/s42254-021-00314-5,,Physics-informed machine learning,Nature Reviews Physics,,,2021,review,en,6361,"['Karniadakis G.', 'Kevrekidis I.', 'Lu L.', 'Perdikaris P.', 'Wang S.', 'Yang L.']","['George Em Karniadakis', 'Ioannis G. Kevrekidis', 'Lu Lu', 'Paris Perdikaris', 'Sifan Wang', 'Liu Yang']","['Brown University', 'Johns Hopkins University', 'Massachusetts Institute of Technology', 'University of Pennsylvania', 'Applied Mathematics (United States)', 'University of Pennsylvania', 'Brown University']",,[],"['Computer science', 'Artificial intelligence', 'Machine learning', 'Multiphysics', 'Inference', 'Artificial neural network', 'Physical law', 'Field (mathematics)', 'Discretization', 'Kernel method', 'Deep learning', 'Theoretical computer science', 'Mathematics', 'Support vector machine', 'Finite element method']","['Computer science', 'Artificial intelligence', 'Machine learning', 'Multiphysics', 'Inference', 'Artificial neural network', 'Physical law', 'Field (mathematics)', 'Discretization', 'Kernel method', 'Deep learning', 'Theoretical computer science', 'Mathematics', 'Support vector machine', 'Finite element method', 'Mathematical analysis', 'Philosophy', 'Pure mathematics', 'Physics', 'Epistemology', 'Thermodynamics']",,3,6,422,440,Karniadakis 2021 Nature V3,Brown University;Johns Hopkins University;Massachusetts Institute of Technology;University of Pennsylvania;Applied Mathematics (United States);University of Pennsylvania;Brown University,Brown University,Brown University;Johns Hopkins University;Massachusetts Institute of Technology;University of Pennsylvania;Applied Mathematics (United States);University of Pennsylvania;Brown University
+OPENALEX,https://openalex.org/W1601795611,10.1108/03684920710743466,,Pattern Recognition and Machine Learning,Kybernetes,,,2007,article,en,8434,[],[],[],,[],"['Computer science', 'Cybernetics', 'Artificial intelligence', 'Machine learning']","['Computer science', 'Cybernetics', 'Artificial intelligence', 'Machine learning']",,36,2,275,275,UNKNOWN 2007 Kybernetes V36,,,
+OPENALEX,https://openalex.org/W1534477342,10.1007/3-540-45014-9_1,,Ensemble Methods in Machine Learning,Lecture notes in computer science,,,2000,book-chapter,en,7794,['Dietterich T.'],['Thomas G. Dietterich'],['Oregon State University'],,[],"['Computer science', 'Overfitting', 'Ensemble learning', 'Boosting (machine learning)', 'AdaBoost', 'Artificial intelligence', 'Machine learning', 'Classifier (UML)', 'Bayesian probability', 'Pattern recognition (psychology)', 'Artificial neural network']","['Computer science', 'Overfitting', 'Ensemble learning', 'Boosting (machine learning)', 'AdaBoost', 'Artificial intelligence', 'Machine learning', 'Classifier (UML)', 'Bayesian probability', 'Pattern recognition (psychology)', 'Artificial neural network']",,,,1,15,Dietterich 2000 Lecture VV0,Oregon State University,Oregon State University,Oregon State University
+OPENALEX,https://openalex.org/W2559394418,10.1038/nature23474,28905917,Quantum machine learning,Nature,,,2017,article,en,4376,"['Biamonte J.', 'Wittek P.', 'Pancotti N.', 'Rebentrost P.', 'Wiebe N.', 'Lloyd S.']","['Jacob Biamonte', 'Péter Wittek', 'Nicola Pancotti', 'Patrick Rebentrost', 'Nathan Wiebe', 'Seth Lloyd']","['Skolkovo Institute of Science and Technology', 'Institute of Photonic Sciences', 'Max Planck Institute of Quantum Optics', 'Massachusetts Institute of Technology', 'Microsoft (United States)', 'Massachusetts Institute of Technology']",,[],"['Quantum machine learning', 'Computer science', 'Quantum', 'Software', 'Field (mathematics)', 'Quantum computer', 'Artificial intelligence', 'Computer engineering', 'Programming language', 'Physics', 'Mathematics']","['Quantum machine learning', 'Computer science', 'Quantum', 'Software', 'Field (mathematics)', 'Quantum computer', 'Artificial intelligence', 'Computer engineering', 'Programming language', 'Physics', 'Mathematics', 'Pure mathematics', 'Quantum mechanics']",,549,7671,195,202,Biamonte 2017 Nature V549,Skolkovo Institute of Science and Technology;Institute of Photonic Sciences;Max Planck Institute of Quantum Optics;Massachusetts Institute of Technology;Microsoft (United States);Massachusetts Institute of Technology,Skolkovo Institute of Science and Technology,Skolkovo Institute of Science and Technology;Institute of Photonic Sciences;Max Planck Institute of Quantum Optics;Massachusetts Institute of Technology;Microsoft (United States);Massachusetts Institute of Technology
+OPENALEX,https://openalex.org/W2402144811,10.5555/3026877.3026899,,TensorFlow: a system for large-scale machine learning,Operating Systems Design and Implementation,,,2016,article,en,6353,"['Abadi M.', 'Barham P.', 'Chen J.', 'Chen Z.', 'Davis A.', 'Dean J.', 'Devin M.', 'Ghemawat S.', 'Irving G.', 'Isard M.', 'Kudlur M.', 'Levenberg J.', 'Monga R.', 'Moore S.', 'Murray D.', 'Steiner B.', 'Tucker P.', 'Vasudevan V.', 'Warden P.', 'Wicke M.', 'Yu Y.', 'Zheng X.']","['Martı́n Abadi', 'Paul Barham', 'Jianmin Chen', 'Zhifeng Chen', 'Andy Davis', 'Jay B. Dean', 'Matthieu Devin', 'Sanjay Ghemawat', 'Geoffrey Irving', 'Michael Isard', 'Manjunath Kudlur', 'Josh Levenberg', 'Rajat Monga', 'Sherry Moore', 'Derek G. Murray', 'Benoit Steiner', 'Paul A. Tucker', 'Vijay Vasudevan', 'Pete Warden', 'Martin Wicke', 'Yuan Yu', 'Xiaoqiang Zheng']","['Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)']",,[],"['Dataflow', 'Computer science', 'Artificial intelligence', 'Multi-core processor', 'Machine learning', 'Computer architecture', 'Deep learning', 'Scalability', 'Inference', 'Artificial neural network', 'Dataflow architecture', 'Computation', 'Distributed computing', 'Parallel computing', 'Programming language', 'Operating system']","['Dataflow', 'Computer science', 'Artificial intelligence', 'Multi-core processor', 'Machine learning', 'Computer architecture', 'Deep learning', 'Scalability', 'Inference', 'Artificial neural network', 'Dataflow architecture', 'Computation', 'Distributed computing', 'Parallel computing', 'Programming language', 'Operating system']",,,,265,283,Abadi 2016 Operating VV0,Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States),Google (United States),Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States);Google (United States)
+OPENALEX,https://openalex.org/W2912213068,10.1145/3298981,,Federated Machine Learning,ACM Transactions on Intelligent Systems and Technology,,,2019,article,en,5789,"['Yang Q.', 'Liu Y.', 'Chen T.', 'Tong Y.']","['Qiang Yang', 'Yang Liu', 'Tianjian Chen', 'Yongxin Tong']","['Hong Kong University of Science and Technology', 'Beihang University']",,[],"['Computer science', 'Federated learning', 'Transfer of learning', 'Artificial intelligence', 'Data science', 'Computer security']","['Computer science', 'Federated learning', 'Transfer of learning', 'Artificial intelligence', 'Data science', 'Computer security']",,10,2,1,19,Yang 2019 ACM V10,Hong Kong University of Science and Technology;Beihang University,Hong Kong University of Science and Technology,Hong Kong University of Science and Technology;Beihang University
+OPENALEX,https://openalex.org/W2155653793,10.1016/s0031-3203(96)00142-2,,The use of the area under the ROC curve in the evaluation of machine learning algorithms,Pattern Recognition,,,1997,article,en,7200,['Bradley A.'],['Andrew P. Bradley'],['University of Queensland'],,[],"['Algorithm', 'Receiver operating characteristic', 'Machine learning', 'Artificial intelligence', 'Perceptron', 'Computer science', 'Discriminant', 'Multilayer perceptron', 'Mathematics', 'Artificial neural network']","['Algorithm', 'Receiver operating characteristic', 'Machine learning', 'Artificial intelligence', 'Perceptron', 'Computer science', 'Discriminant', 'Multilayer perceptron', 'Mathematics', 'Artificial neural network']",,30,7,1145,1159,Bradley 1997 Pattern V30,University of Queensland,University of Queensland,University of Queensland
+OPENALEX,https://openalex.org/W2009086942,10.1198/tech.2007.s518,,Pattern Recognition and Machine Learning,Technometrics,,,2007,article,en,4651,['Neal R.'],['Radford M. Neal'],['University of Toronto'],,[],"['Artificial intelligence', 'Computer science', 'Machine learning', 'Pattern recognition (psychology)']","['Artificial intelligence', 'Computer science', 'Machine learning', 'Pattern recognition (psychology)']",,49,3,366,366,Neal 2007 Technometrics V49,University of Toronto,University of Toronto,University of Toronto
+OPENALEX,https://openalex.org/W1506806321,,,Pattern Recognition and Machine Learning (Information Science and Statistics),Springer eBooks,,,2006,book,en,8356,['Bishop C.'],['Chris Bishop'],[],,[],"['Artificial intelligence', 'Computer science', 'Statistics', 'Pattern recognition (psychology)', 'Machine learning', 'Mathematics']","['Artificial intelligence', 'Computer science', 'Statistics', 'Pattern recognition (psychology)', 'Machine learning', 'Mathematics']",,,,,,Bishop 2006 Springer VV0,,,
+OPENALEX,https://openalex.org/W2131241448,10.48550/arxiv.1206.2944,,Practical Bayesian Optimization of Machine Learning Algorithms,arXiv (Cornell University),,,2012,preprint,en,5659,"['Snoek J.', 'Larochelle H.', 'Adams R.']","['Jasper Snoek', 'Hugo Larochelle', 'Ryan P. Adams']","['University of Toronto', 'Université de Sherbrooke', 'Harvard University']",,[],"['Bayesian optimization', 'Computer science', 'Bayesian probability', 'Machine learning', 'Artificial intelligence', 'Optimization algorithm', 'Algorithm', 'Mathematical optimization', 'Mathematics']","['Bayesian optimization', 'Computer science', 'Bayesian probability', 'Machine learning', 'Artificial intelligence', 'Optimization algorithm', 'Algorithm', 'Mathematical optimization', 'Mathematics']",,,,,,Snoek 2012 arXiv VV0,University of Toronto;Université de Sherbrooke;Harvard University,University of Toronto,University of Toronto;Université de Sherbrooke;Harvard University
+OPENALEX,https://openalex.org/W2884430236,10.1038/s41586-018-0337-2,30046072,Machine learning for molecular and materials science,Nature,,,2018,review,en,4459,"['Butler K.', 'Davies D.', 'Cartwright H.', 'Isayev O.', 'Walsh A.']","['Keith T. Butler', 'Daniel W. Davies', 'Hugh Cartwright', 'Olexandr Isayev', 'Aron Walsh']","['Research Complex at Harwell', 'Rutherford Appleton Laboratory', 'University of Bath', 'University of Oxford', 'University of North Carolina at Chapel Hill', 'Yonsei University']",,[],"['Computer science', 'Field (mathematics)', 'Data science', 'Characterization (materials science)', 'Domain (mathematical analysis)', 'Artificial intelligence', 'Cognitive science', 'Nanotechnology', 'Machine learning', 'Psychology', 'Materials science']","['Computer science', 'Field (mathematics)', 'Data science', 'Characterization (materials science)', 'Domain (mathematical analysis)', 'Artificial intelligence', 'Cognitive science', 'Nanotechnology', 'Machine learning', 'Psychology', 'Materials science', 'Mathematics', 'Mathematical analysis', 'Pure mathematics']",,559,7715,547,555,Butler 2018 Nature V559,Research Complex at Harwell;Rutherford Appleton Laboratory;University of Bath;University of Oxford;University of North Carolina at Chapel Hill;Yonsei University,Research Complex at Harwell,Research Complex at Harwell;Rutherford Appleton Laboratory;University of Bath;University of Oxford;University of North Carolina at Chapel Hill;Yonsei University
+OPENALEX,https://openalex.org/W2913668833,,,Proceedings of the 25th international conference on Machine learning,,,,2008,article,en,5549,"['Cohen W.', 'McCallum A.', 'Roweis S.']","['William W. Cohen', 'Andrew McCallum', 'Sam T. Roweis']","['Carnegie Mellon University', 'University of Massachusetts Amherst', 'Google (United States)', 'University of Toronto']",,[],"['Presentation (obstetrics)', 'Library science', 'Computer science', 'Medical education', 'Artificial intelligence', 'Medicine']","['Presentation (obstetrics)', 'Library science', 'Computer science', 'Medical education', 'Artificial intelligence', 'Medicine', 'Radiology']",,,,,,Cohen 2008 UNKNOWNJ VV0,Carnegie Mellon University;University of Massachusetts Amherst;Google (United States);University of Toronto,Carnegie Mellon University,Carnegie Mellon University;University of Massachusetts Amherst;Google (United States);University of Toronto
+OPENALEX,https://openalex.org/W2934399013,10.1056/nejmra1814259,30943338,Machine Learning in Medicine,New England Journal of Medicine,,,2019,review,en,3873,"['Rajkomar A.', 'Dean J.', 'Kohane I.']","['Alvin Rajkomar', 'Jay B. Dean', 'Isaac S. Kohane']","['Google (United States)', 'Google (United States)', 'Google (United States)', 'Harvard University']",,[],"['Download', 'Computer science', 'Data science', 'Medicine', 'Medical education', 'Artificial intelligence', 'World Wide Web']","['Download', 'Computer science', 'Data science', 'Medicine', 'Medical education', 'Artificial intelligence', 'World Wide Web']",,380,14,1347,1358,Rajkomar 2019 New V380,Google (United States);Google (United States);Google (United States);Harvard University,Google (United States),Google (United States);Google (United States);Google (United States);Harvard University
+OPENALEX,https://openalex.org/W1485009520,10.48550/arxiv.1506.04214,,Convolutional LSTM Network: A Machine Learning Approach for Precipitation Nowcasting,arXiv (Cornell University),,,2015,preprint,en,6642,"['Shi X.', 'Chen Z.', 'Wang H.', 'Yeung D.', 'Wong W.', 'Woo W.']","['Xingjian Shi', 'Zhourong Chen', 'Hao Wang', 'Dit‐Yan Yeung', 'Wai Kin Wong', 'Wang‐chun Woo']","['Hong Kong University of Science and Technology', 'Hong Kong University of Science and Technology', 'Hong Kong University of Science and Technology', 'Hong Kong University of Science and Technology', 'Hong Kong Observatory', 'Hong Kong Observatory']",,[],"['Nowcasting', 'Computer science', 'Convolutional neural network', 'Artificial intelligence', 'Precipitation', 'State (computer science)', 'Machine learning', 'Perspective (graphical)', 'Pattern recognition (psychology)', 'Algorithm', 'Meteorology', 'Geography']","['Nowcasting', 'Computer science', 'Convolutional neural network', 'Artificial intelligence', 'Precipitation', 'State (computer science)', 'Machine learning', 'Perspective (graphical)', 'Pattern recognition (psychology)', 'Algorithm', 'Meteorology', 'Geography']",,,,,,Shi 2015 arXiv VV0,Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong Observatory;Hong Kong Observatory,Hong Kong University of Science and Technology,Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong University of Science and Technology;Hong Kong Observatory;Hong Kong Observatory
+OPENALEX,https://openalex.org/W2149684865,10.1007/bfb0026683,,Text categorization with Support Vector Machines: Learning with many relevant features,Lecture notes in computer science,,,1998,book-chapter,en,7977,['Joachims T.'],['Thorsten Joachims'],['TU Dortmund University'],,[],"['Support vector machine', 'Computer science', 'Machine learning', 'Artificial intelligence', 'Categorization', 'Text categorization', 'Task (project management)', 'Variety (cybernetics)', 'Empirical research', 'Relevance vector machine', 'Mathematics']","['Support vector machine', 'Computer science', 'Machine learning', 'Artificial intelligence', 'Categorization', 'Text categorization', 'Task (project management)', 'Variety (cybernetics)', 'Empirical research', 'Relevance vector machine', 'Mathematics', 'Statistics', 'Management', 'Economics']",,,,137,142,Joachims 1998 Lecture VV0,TU Dortmund University,TU Dortmund University,TU Dortmund University
+OPENALEX,https://openalex.org/W114517082,10.1007/978-3-7908-2604-3_16,,Large-Scale Machine Learning with Stochastic Gradient Descent,,,,2010,book-chapter,en,5615,['Bottou L.'],['Léon Bottou'],['Princeton University'],,[],"['Stochastic gradient descent', 'Computer science', 'Scale (ratio)', 'Stochastic optimization', 'Gradient descent', 'Set (abstract data type)', 'Online machine learning', 'Context (archaeology)', 'Sample (material)', 'Artificial intelligence', 'Algorithm', 'Mathematical optimization', 'Machine learning', 'Mathematics', 'Active learning (machine learning)', 'Artificial neural network']","['Stochastic gradient descent', 'Computer science', 'Scale (ratio)', 'Stochastic optimization', 'Gradient descent', 'Set (abstract data type)', 'Online machine learning', 'Context (archaeology)', 'Sample (material)', 'Artificial intelligence', 'Algorithm', 'Mathematical optimization', 'Machine learning', 'Mathematics', 'Active learning (machine learning)', 'Artificial neural network', 'Programming language', 'Chromatography', 'Paleontology', 'Physics', 'Chemistry', 'Biology', 'Quantum mechanics']",,,,177,186,Bottou 2010 UNKNOWNJ VV0,Princeton University,Princeton University,Princeton University
+OPENALEX,https://openalex.org/W2945976633,10.1038/s42256-019-0048-x,35603010,Stop explaining black box machine learning models for high stakes decisions and use interpretable models instead,Nature Machine Intelligence,,,2019,article,en,8741,['Rudin C.'],['Cynthia Rudin'],['Duke University'],,[],"['Black box', 'Harm', 'Computer science', 'Key (lock)', 'Criminal justice', 'Artificial intelligence', 'Economic Justice', 'Machine learning', 'Data science', 'Criminology', 'Psychology', 'Computer security', 'Political science', 'Social psychology', 'Law']","['Black box', 'Harm', 'Computer science', 'Key (lock)', 'Criminal justice', 'Artificial intelligence', 'Economic Justice', 'Machine learning', 'Data science', 'Criminology', 'Psychology', 'Computer security', 'Political science', 'Social psychology', 'Law']",,1,5,206,215,Rudin 2019 Nature V1,Duke University,Duke University,Duke University
+OPENALEX,https://openalex.org/W1680797894,10.1007/978-0-387-30164-8,,Encyclopedia of Machine Learning,,,,2010,book,en,3461,"['Sammut C.', 'Webb G.']","['Claude Sammut', 'Geoffrey I. Webb']",['UNSW Sydney'],,[],"['Encyclopedia', 'Computer science', 'Artificial intelligence', 'Data science', 'Library science']","['Encyclopedia', 'Computer science', 'Artificial intelligence', 'Data science', 'Library science']",,,,,,Sammut 2010 UNKNOWNJ VV0,UNSW Sydney,UNSW Sydney,UNSW Sydney
+OPENALEX,https://openalex.org/W3135028703,10.1007/s42979-021-00592-x,33778771,"Machine Learning: Algorithms, Real-World Applications and Research Directions",SN Computer Science,,,2021,review,en,5063,['Sarker I.'],['Iqbal H. Sarker'],"['Chittagong University of Engineering & Technology', 'Swinburne University of Technology']",,[],"['Computer science', 'Artificial intelligence', 'Machine learning', 'Key (lock)', 'Big data', 'Data science', 'Data mining', 'Computer security']","['Computer science', 'Artificial intelligence', 'Machine learning', 'Key (lock)', 'Big data', 'Data science', 'Data mining', 'Computer security']",,2,3,160,160,Sarker 2021 SN V2,Chittagong University of Engineering & Technology;Swinburne University of Technology,Chittagong University of Engineering & Technology,Chittagong University of Engineering & Technology;Swinburne University of Technology
+OPENALEX,https://openalex.org/W1502922572,10.1007/978-3-540-28650-9_4,,Gaussian Processes in Machine Learning,Lecture notes in computer science,,,2004,book-chapter,en,5101,['Rasmussen C.'],['Carl Edward Rasmussen'],['Max Planck Institute for Biological Cybernetics'],,[],"['Computer science', 'Hyperparameter', 'Gaussian process', 'Focus (optics)', 'Machine learning', 'Artificial intelligence', 'Process (computing)', 'Gaussian', 'Marginal likelihood', 'Simple (philosophy)', 'Kriging', 'Marginal distribution', 'Algorithm', 'Mathematical optimization', 'Random variable', 'Statistics', 'Mathematics']","['Computer science', 'Hyperparameter', 'Gaussian process', 'Focus (optics)', 'Machine learning', 'Artificial intelligence', 'Process (computing)', 'Gaussian', 'Marginal likelihood', 'Simple (philosophy)', 'Kriging', 'Marginal distribution', 'Algorithm', 'Mathematical optimization', 'Random variable', 'Statistics', 'Mathematics', 'Philosophy', 'Operating system', 'Optics', 'Bayesian probability', 'Epistemology', 'Physics', 'Quantum mechanics']",,,,63,71,Rasmussen 2004 Lecture VV0,Max Planck Institute for Biological Cybernetics,Max Planck Institute for Biological Cybernetics,Max Planck Institute for Biological Cybernetics
+OPENALEX,https://openalex.org/W2619383789,10.1109/tpami.2018.2798607,29994351,Multimodal Machine Learning: A Survey and Taxonomy,IEEE Transactions on Pattern Analysis and Machine Intelligence,,,2018,article,en,4126,"['Baltrušaitis T.', 'Ahuja C.', 'Morency L.']","['Tadas Baltrušaitis', 'Chaitanya Ahuja', 'Louis–Philippe Morency']","['Microsoft Research (United Kingdom)', 'Carnegie Mellon University', 'Carnegie Mellon University']",,[],"['Multimodal learning', 'Computer science', 'Artificial intelligence', 'Modalities', 'Taxonomy (biology)', 'Categorization', 'Multimodality', 'Field (mathematics)', 'Machine learning', 'Human–computer interaction', 'World Wide Web']","['Multimodal learning', 'Computer science', 'Artificial intelligence', 'Modalities', 'Taxonomy (biology)', 'Categorization', 'Multimodality', 'Field (mathematics)', 'Machine learning', 'Human–computer interaction', 'World Wide Web', 'Pure mathematics', 'Sociology', 'Social science', 'Botany', 'Mathematics', 'Biology']",,41,2,423,443,Baltrušaitis 2018 IEEE V41,Microsoft Research (United Kingdom);Carnegie Mellon University;Carnegie Mellon University,Microsoft Research (United Kingdom),Microsoft Research (United Kingdom);Carnegie Mellon University;Carnegie Mellon University
+OPENALEX,https://openalex.org/W2177870565,10.1161/circulationaha.115.001593,26572668,Machine Learning in Medicine,Circulation,,,2015,review,en,3391,['Deo R.'],['Rahul C. Deo'],['QB3'],,[],"['Medicine', 'Medical physics', 'Medical education', 'Intensive care medicine']","['Medicine', 'Medical physics', 'Medical education', 'Intensive care medicine']",,132,20,1920,1930,Deo 2015 Circulation V132,QB3,QB3,QB3
+OPENALEX,https://openalex.org/W2750384547,10.48550/arxiv.1708.07747,,Fashion-MNIST: a Novel Image Dataset for Benchmarking Machine Learning Algorithms,arXiv (Cornell University),,,2017,preprint,en,6068,"['Han X.', 'Rasul K.', 'Vollgraf R.']","['Xiao, Han', 'Kashif Rasul', 'Roland Vollgraf']",[],,[],"['MNIST database', 'Benchmarking', 'Artificial intelligence', 'Grayscale', 'Computer science', 'Set (abstract data type)', 'Test set', 'Pattern recognition (psychology)', 'Image (mathematics)', 'Machine learning', 'Algorithm', 'Deep learning']","['MNIST database', 'Benchmarking', 'Artificial intelligence', 'Grayscale', 'Computer science', 'Set (abstract data type)', 'Test set', 'Pattern recognition (psychology)', 'Image (mathematics)', 'Machine learning', 'Algorithm', 'Deep learning', 'Programming language', 'Business', 'Marketing']",,,,,,Han 2017 arXiv VV0,,,
+OPENALEX,https://openalex.org/W1873332500,,,Supervised Machine Learning: A Review of Classification Techniques,,,,2007,review,en,4147,['Kotsiantis S.'],['Sotiris Kotsiantis'],['University of Peloponnese'],,[],"['Machine learning', 'Artificial intelligence', 'Computer science', 'Classifier (UML)', 'Supervised learning', 'One-class classification', 'Class (philosophy)', 'Semi-supervised learning', 'Artificial neural network']","['Machine learning', 'Artificial intelligence', 'Computer science', 'Classifier (UML)', 'Supervised learning', 'One-class classification', 'Class (philosophy)', 'Semi-supervised learning', 'Artificial neural network']",,160,3,249,24,Kotsiantis 2007 UNKNOWNJ V160,University of Peloponnese,University of Peloponnese,University of Peloponnese
+OPENALEX,https://openalex.org/W4236362309,10.1017/cbo9781107298019,,Understanding Machine Learning,Cambridge University Press eBooks,,,2014,book,en,2907,"['Shalev‐Shwartz S.', 'Ben-David S.']","['Shai Shalev‐Shwartz', 'Shai Ben-David']","['Hebrew University of Jerusalem', 'University of Waterloo']",,[],"['Computer science', 'Artificial intelligence', 'Stability (learning theory)', 'Algorithmic learning theory', 'Computational learning theory', 'Machine learning', 'Presentation (obstetrics)', 'Stochastic gradient descent', 'Convexity', 'Online machine learning', 'Artificial neural network']","['Computer science', 'Artificial intelligence', 'Stability (learning theory)', 'Algorithmic learning theory', 'Computational learning theory', 'Machine learning', 'Presentation (obstetrics)', 'Stochastic gradient descent', 'Convexity', 'Online machine learning', 'Artificial neural network', 'Medicine', 'Economics', 'Financial economics', 'Radiology']",,,,,,Shalev‐Shwartz 2014 Cambridge VV0,Hebrew University of Jerusalem;University of Waterloo,Hebrew University of Jerusalem,Hebrew University of Jerusalem;University of Waterloo
+OPENALEX,https://openalex.org/W2560674852,10.1145/1390156,,Proceedings of the 25th international conference on Machine learning - ICML '08,,,,2008,paratext,en,6716,[],[],[],,[],"['Computer science', 'Artificial intelligence']","['Computer science', 'Artificial intelligence']",,,,,,UNKNOWN 2008 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W3198350258,10.1147/rd.33.0210,,Some Studies in Machine Learning Using the Game of Checkers,IBM Journal of Research and Development,,,1959,article,en,4330,['Samuel A.'],['Arthur L. Samuel'],[],,[],"['Computer science', 'Artificial intelligence', 'Machine learning']","['Computer science', 'Artificial intelligence', 'Machine learning']",,3,3,210,229,Samuel 1959 IBM V3,,,
+OPENALEX,https://openalex.org/W2535690855,10.1109/sp.2017.41,,Membership Inference Attacks Against Machine Learning Models,,,,2017,article,en,4175,"['Shokri R.', 'Stronati M.', 'Song C.', 'Shmatikov V.']","['Reza Shokri', 'Marco Stronati', 'Congzheng Song', 'Vitaly Shmatikov']","['Cornell University', 'Institut national de recherche en informatique et en automatique', 'Cornell University', 'Cornell University']",,[],"['Inference', 'Machine learning', 'Computer science', 'Artificial intelligence', 'Perspective (graphical)', 'Focus (optics)', 'Data modeling', 'Data mining', 'Adversarial system', 'Database']","['Inference', 'Machine learning', 'Computer science', 'Artificial intelligence', 'Perspective (graphical)', 'Focus (optics)', 'Data modeling', 'Data mining', 'Adversarial system', 'Database', 'Optics', 'Physics']",,,,3,18,Shokri 2017 UNKNOWNJ VV0,Cornell University;Institut national de recherche en informatique et en automatique;Cornell University;Cornell University,Cornell University,Cornell University;Institut national de recherche en informatique et en automatique;Cornell University;Cornell University
+OPENALEX,https://openalex.org/W2885770726,10.3390/s18082674,30110960,Machine Learning in Agriculture: A Review,Sensors,,,2018,review,en,2977,"['Λιάκος Κ.', 'Busato P.', 'Moshou D.', 'Pearson S.', 'Bochtis D.']","['Κωνσταντίνος Λιάκος', 'Patrizia Busato', 'Dimitrios Moshou', 'Simon Pearson', 'Dionysis Bochtis']","['Centre for Research and Technology Hellas', 'University of Turin', 'Aristotle University of Thessaloniki', 'Centre for Research and Technology Hellas', 'University of Lincoln', 'Centre for Research and Technology Hellas']",,[],"['Agriculture', 'Artificial intelligence', 'Precision agriculture', 'Computer science', 'Machine learning', 'Big data', 'Livestock', 'Decision support system', 'Data science', 'Data mining']","['Agriculture', 'Artificial intelligence', 'Precision agriculture', 'Computer science', 'Machine learning', 'Big data', 'Livestock', 'Decision support system', 'Data science', 'Data mining', 'Biology', 'Ecology']",,18,8,2674,2674,Λιάκος 2018 Sensors V18,Centre for Research and Technology Hellas;University of Turin;Aristotle University of Thessaloniki;Centre for Research and Technology Hellas;University of Lincoln;Centre for Research and Technology Hellas,Centre for Research and Technology Hellas,Centre for Research and Technology Hellas;University of Turin;Aristotle University of Thessaloniki;Centre for Research and Technology Hellas;University of Lincoln;Centre for Research and Technology Hellas
+OPENALEX,https://openalex.org/W1532362218,10.1007/11744023_34,,Machine Learning for High-Speed Corner Detection,Lecture notes in computer science,,,2006,book-chapter,en,4371,"['Rosten E.', 'Drummond T.']","['Edward Rosten', 'Tom Drummond']","['University of Cambridge', 'University of Cambridge']",,[],"['Detector', 'Scale-invariant feature transform', 'Computer science', 'Frame rate', 'Artificial intelligence', 'Corner detection', 'Frame (networking)', 'Feature (linguistics)', 'Computer vision', 'Process (computing)', 'Speedup', 'Feature extraction', 'Pattern recognition (psychology)', 'Image (mathematics)', 'Telecommunications']","['Detector', 'Scale-invariant feature transform', 'Computer science', 'Frame rate', 'Artificial intelligence', 'Corner detection', 'Frame (networking)', 'Feature (linguistics)', 'Computer vision', 'Process (computing)', 'Speedup', 'Feature extraction', 'Pattern recognition (psychology)', 'Image (mathematics)', 'Telecommunications', 'Operating system', 'Philosophy', 'Linguistics']",,,,430,443,Rosten 2006 Lecture VV0,University of Cambridge;University of Cambridge,University of Cambridge,University of Cambridge;University of Cambridge
+OPENALEX,https://openalex.org/W2588003345,10.1371/journal.pone.0169748,28207752,SoilGrids250m: Global gridded soil information based on machine learning,PLoS ONE,,,2017,article,en,4623,"['Hengl T.', 'Jesus J.', 'Heuvelink G.', 'González M.', 'Kilibarda M.', 'Blagotić A.', 'Shangguan W.', 'Wright M.', 'Geng X.', 'Bauer-Marschallinger B.', 'Guevara M.', 'Vargas R.', 'MacMillan R.', 'Batjes N.', 'Leenaars J.', 'Ribeiro E.', 'Wheeler I.', 'Mantel S.', 'Kempen B.']","['Tomislav Hengl', 'Jorge Mendes de Jesus', 'G.B.M. Heuvelink', 'M. Ruiperez González', 'Milan Kilibarda', 'Aleksandar Blagotić', 'Wei Shangguan', 'Marvin N. Wright', 'Xiaoyuan Geng', 'Bernhard Bauer-Marschallinger', 'Mário Guevara', 'Rodrigo Vargas', 'R.A. MacMillan', 'N.H. Batjes', 'J.G.B. Leenaars', 'Eloi Ribeiro', 'Ichsani Wheeler', 'S. Mantel', 'Bas Kempen']","['ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'University of Belgrade', 'Sun Yat-sen University', 'Institut für Medizinische Informatik, Biometrie und Epidemiologie', 'Agriculture and Agri-Food Canada', 'TU Wien', 'University of Delaware', 'University of Delaware', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information', 'ISRIC - World Soil Information']",,[],"['Random forest', 'Landform', 'Soil texture', 'Gradient boosting', 'Soil science', 'Environmental science', 'Soil map', 'Shuttle Radar Topography Mission', 'Ensemble learning', 'Spatial variability', 'Standard deviation', 'Land cover', 'Computer science', 'Remote sensing', 'Artificial intelligence', 'Cartography', 'Mathematics', 'Land use', 'Digital elevation model', 'Statistics', 'Geology', 'Soil water']","['Random forest', 'Landform', 'Soil texture', 'Gradient boosting', 'Soil science', 'Environmental science', 'Soil map', 'Shuttle Radar Topography Mission', 'Ensemble learning', 'Spatial variability', 'Standard deviation', 'Land cover', 'Computer science', 'Remote sensing', 'Artificial intelligence', 'Cartography', 'Mathematics', 'Land use', 'Digital elevation model', 'Statistics', 'Geology', 'Soil water', 'Geography', 'Engineering', 'Civil engineering']",,12,2,e0169748,e0169748,Hengl 2017 PLoS V12,"ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;University of Belgrade;Sun Yat-sen University;Institut für Medizinische Informatik, Biometrie und Epidemiologie;Agriculture and Agri-Food Canada;TU Wien;University of Delaware;University of Delaware;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information",ISRIC - World Soil Information,"ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;University of Belgrade;Sun Yat-sen University;Institut für Medizinische Informatik, Biometrie und Epidemiologie;Agriculture and Agri-Food Canada;TU Wien;University of Delaware;University of Delaware;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information;ISRIC - World Soil Information"
+OPENALEX,https://openalex.org/W3153990350,10.1007/s12525-021-00475-2,,Machine learning and deep learning,Electronic Markets,,,2021,article,en,2443,"['Janiesch C.', 'Zschech P.', 'Heinrich K.']","['Christian Janiesch', 'Patrick Zschech', 'Kai Heinrich']","['University of Würzburg', 'Friedrich-Alexander-Universität Erlangen-Nürnberg', 'Otto-von-Guericke-Universität Magdeburg']",,[],"['Deep learning', 'Field (mathematics)', 'Process (computing)', 'Underpinning', 'Artificial neural network', 'Instance-based learning', 'Hyper-heuristic', 'Computational learning theory']","['Artificial intelligence', 'Machine learning', 'Deep learning', 'Computer science', 'Field (mathematics)', 'Process (computing)', 'Underpinning', 'Artificial neural network', 'Instance-based learning', 'Hyper-heuristic', 'Computational learning theory', 'Robot learning', 'Convolutional neural network', 'Intelligent decision support system', 'Deep neural networks', 'Active learning (machine learning)', 'Model building', 'Algorithmic learning theory', 'Deep belief network', 'Unsupervised learning', 'Data modeling', 'Big data', 'Applications of artificial intelligence']",,31,3,685,695,Janiesch 2021 Electronic V31,University of Würzburg;Friedrich-Alexander-Universität Erlangen-Nürnberg;Otto-von-Guericke-Universität Magdeburg,University of Würzburg,University of Würzburg;Friedrich-Alexander-Universität Erlangen-Nürnberg;Otto-von-Guericke-Universität Magdeburg
+OPENALEX,https://openalex.org/W1495061682,,,Correlation-based Feature Selection for Machine Learning,,,,1998,article,en,3502,['Hall M.'],['Mark Hall'],[],,[],"['Artificial intelligence', 'Feature selection', 'Machine learning', 'Feature (linguistics)', 'Computer science', 'Pattern recognition (psychology)', 'Heuristic', 'Naive Bayes classifier', 'Relevance (law)', 'Correlation', 'Set (abstract data type)', 'Decision tree', 'Data mining', 'Support vector machine', 'Mathematics']","['Artificial intelligence', 'Feature selection', 'Machine learning', 'Feature (linguistics)', 'Computer science', 'Pattern recognition (psychology)', 'Heuristic', 'Naive Bayes classifier', 'Relevance (law)', 'Correlation', 'Set (abstract data type)', 'Decision tree', 'Data mining', 'Support vector machine', 'Mathematics', 'Political science', 'Geometry', 'Law', 'Philosophy', 'Programming language', 'Linguistics']",,,,,,Hall 1998 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W2594183968,10.1039/c7sc02664a,29629118,MoleculeNet: a benchmark for molecular machine learning,Chemical Science,,,2017,article,en,2910,"['Wu Z.', 'Ramsundar B.', 'Feinberg E.', 'Gomes J.', 'Geniesse C.', 'Pappu A.', 'Leswing K.', 'Pande V.']","['Zhenqin Wu', 'Bharath Ramsundar', 'Evan N. Feinberg', 'Joseph Gomes', 'Caleb Geniesse', 'Aneesh Pappu', 'Karl Leswing', 'Vijay S. Pande']","['Stanford Medicine', 'Stanford University', 'Stanford Medicine', 'Stanford University', 'Stanford Medicine', 'Stanford Medicine', 'Stanford University', 'Stanford Medicine', 'Stanford Medicine', 'Stanford University', 'Schrodinger (United States)', 'Stanford Medicine', 'Stanford University']",,[],"['Benchmark (surveying)', 'Computer science', 'Machine learning', 'Artificial intelligence', 'Scale (ratio)', 'Physics', 'Geography']","['Benchmark (surveying)', 'Computer science', 'Machine learning', 'Artificial intelligence', 'Scale (ratio)', 'Physics', 'Geography', 'Geodesy', 'Quantum mechanics']",,9,2,513,530,Wu 2017 Chemical V9,Stanford Medicine;Stanford University;Stanford Medicine;Stanford University;Stanford Medicine;Stanford Medicine;Stanford University;Stanford Medicine;Stanford Medicine;Stanford University;Schrodinger (United States);Stanford Medicine;Stanford University,Stanford Medicine,Stanford Medicine;Stanford University;Stanford Medicine;Stanford University;Stanford Medicine;Stanford Medicine;Stanford University;Stanford Medicine;Stanford Medicine;Stanford University;Schrodinger (United States);Stanford Medicine;Stanford University
+OPENALEX,https://openalex.org/W2040884411,10.1016/s0004-3702(97)00063-5,,Selection of relevant features and examples in machine learning,Artificial Intelligence,,,1997,article,en,3293,"['Blum A.', 'Langley P.']","['Avrim Blum', 'Pat Langley']","['Carnegie Mellon University', 'Institute for the Study of Learning and Expertise', 'Daimler (United States)']",,[],"['Computer science', 'Machine learning', 'Artificial intelligence', 'Focus (optics)', 'Key (lock)', 'Selection (genetic algorithm)', 'Feature selection', 'Work (physics)', 'Data science', 'Engineering']","['Computer science', 'Machine learning', 'Artificial intelligence', 'Focus (optics)', 'Key (lock)', 'Selection (genetic algorithm)', 'Feature selection', 'Work (physics)', 'Data science', 'Engineering', 'Computer security', 'Physics', 'Mechanical engineering', 'Optics']",,97,1-2,245,271,Blum 1997 Artificial V97,Carnegie Mellon University;Institute for the Study of Learning and Expertise;Daimler (United States),Carnegie Mellon University,Carnegie Mellon University;Institute for the Study of Learning and Expertise;Daimler (United States)
+OPENALEX,https://openalex.org/W2594475271,10.48550/arxiv.1702.08608,,Towards A Rigorous Science of Interpretable Machine Learning,arXiv (Cornell University),,,2017,preprint,en,3136,"['Doshi‐Velez F.', 'Kim B.']","['Finale Doshi‐Velez', 'Been Kim']",[],,[],"['Interpretability', 'Artificial intelligence', 'Machine learning', 'Computer science', 'Taxonomy (biology)', 'Position paper']","['Interpretability', 'Artificial intelligence', 'Machine learning', 'Computer science', 'Taxonomy (biology)', 'Position paper', 'Biology', 'Botany', 'World Wide Web']",,,,,,Doshi‐Velez 2017 arXiv VV0,,,
+OPENALEX,https://openalex.org/W2007339694,10.1109/msp.2012.2211477,,The MNIST Database of Handwritten Digit Images for Machine Learning Research [Best of the Web],IEEE Signal Processing Magazine,,,2012,article,en,4581,['Deng L.'],['Li Deng'],['Microsoft (United States)'],,[],"['MNIST database', 'Computer science', 'Optical character recognition', 'Artificial intelligence', 'Handwriting recognition', 'Numerical digit', 'Digit recognition', 'Character (mathematics)', 'Intelligent word recognition', 'Deep learning', 'Character recognition', 'Pattern recognition (psychology)', 'Speech recognition', 'Intelligent character recognition', 'Natural language processing', 'Image (mathematics)', 'Feature extraction', 'Artificial neural network', 'Arithmetic', 'Mathematics']","['MNIST database', 'Computer science', 'Optical character recognition', 'Artificial intelligence', 'Handwriting recognition', 'Numerical digit', 'Digit recognition', 'Character (mathematics)', 'Intelligent word recognition', 'Deep learning', 'Character recognition', 'Pattern recognition (psychology)', 'Speech recognition', 'Intelligent character recognition', 'Natural language processing', 'Image (mathematics)', 'Feature extraction', 'Artificial neural network', 'Arithmetic', 'Mathematics', 'Geometry']",,29,6,141,142,Deng 2012 IEEE V29,Microsoft (United States),Microsoft (United States),Microsoft (United States)
+OPENALEX,https://openalex.org/W607505555,10.1017/cbo9781107298019,,Understanding Machine Learning: From Theory To Algorithms,,,,2015,book,en,3088,"['Shalev‐Shwartz S.', 'Ben-David S.']","['Shai Shalev‐Shwartz', 'Shai Ben-David']","['Hebrew University of Jerusalem', 'University of Waterloo']",,[],"['Computer science', 'Artificial intelligence', 'Field (mathematics)', 'Machine learning', 'Computational learning theory', 'Stability (learning theory)', 'Algorithmic learning theory', 'Stochastic gradient descent', 'Algorithm', 'Presentation (obstetrics)', 'Convexity', 'Online machine learning', 'Artificial neural network', 'Mathematics']","['Computer science', 'Artificial intelligence', 'Field (mathematics)', 'Machine learning', 'Computational learning theory', 'Stability (learning theory)', 'Algorithmic learning theory', 'Stochastic gradient descent', 'Algorithm', 'Presentation (obstetrics)', 'Convexity', 'Online machine learning', 'Artificial neural network', 'Mathematics', 'Radiology', 'Pure mathematics', 'Economics', 'Medicine', 'Financial economics']",,,,,,Shalev‐Shwartz 2015 UNKNOWNJ VV0,Hebrew University of Jerusalem;University of Waterloo,Hebrew University of Jerusalem,Hebrew University of Jerusalem;University of Waterloo
+OPENALEX,https://openalex.org/W2115252128,10.5555/1577069.1755843,,Dlib-ml: A Machine Learning Toolkit,,,,2009,article,en,2921,['King D.'],['Davis E. King'],[],,[],"['Computer science', 'Python (programming language)', 'Debugging', 'Machine learning', 'Cluster analysis', 'Implementation', 'Programming language', 'Artificial intelligence', 'Software engineering', 'Documentation', 'Software', 'Data mining']","['Computer science', 'Python (programming language)', 'Debugging', 'Machine learning', 'Cluster analysis', 'Implementation', 'Programming language', 'Artificial intelligence', 'Software engineering', 'Documentation', 'Software', 'Data mining']",,10,60,1755,1758,King 2009 UNKNOWNJ V10,,,
+OPENALEX,https://openalex.org/W4400134761,10.21275/art20203995,,Machine Learning Algorithms - A Review,International Journal of Science and Research (IJSR),,,2020,review,en,2452,['Mahesh B.'],['Batta Mahesh'],[],,[],"['Computer science', 'Machine learning', 'Artificial intelligence', 'Algorithm']","['Computer science', 'Machine learning', 'Artificial intelligence', 'Algorithm']",,9,1,381,386,Mahesh 2020 International V9,,,
+OPENALEX,https://openalex.org/W2161336914,10.1145/2347736.2347755,,A few useful things to know about machine learning,Communications of the ACM,,,2012,article,en,3232,['Domingos P.'],['Pedro Domingos'],"['University of Washington', 'Seattle University']",,[],"['Computer science', 'Need to know', 'Artificial intelligence', 'Machine learning', 'Computer security']","['Computer science', 'Need to know', 'Artificial intelligence', 'Machine learning', 'Computer security']",,55,10,78,87,Domingos 2012 Communications V55,University of Washington;Seattle University,University of Washington,University of Washington;Seattle University
+OPENALEX,https://openalex.org/W3045004532,10.1016/j.neucom.2020.07.061,,On hyperparameter optimization of machine learning algorithms: Theory and practice,Neurocomputing,,,2020,article,en,3107,"['Yang L.', 'Shami A.']","['Li Yang', 'Abdallah Shami']","['Western University', 'Western University']",,[],"['Hyperparameter', 'Computer science', 'Machine learning', 'Algorithm', 'Artificial intelligence', 'Optimization algorithm', 'Mathematical optimization', 'Mathematics']","['Hyperparameter', 'Computer science', 'Machine learning', 'Algorithm', 'Artificial intelligence', 'Optimization algorithm', 'Mathematical optimization', 'Mathematics']",,415,,295,316,Yang 2020 Neurocomputing V415,Western University;Western University,Western University,Western University;Western University
+OPENALEX,https://openalex.org/W2937307539,10.1038/s41573-019-0024-5,30976107,Applications of machine learning in drug discovery and development,Nature Reviews Drug Discovery,,,2019,review,en,2898,"['Vamathevan J.', 'Clark D.', 'Czodrowski P.', 'Dunham I.', 'Ferrán E.', 'Lee G.', 'Li B.', 'Madabhushi A.', 'Shah P.', 'Spitzer M.', 'Zhao S.']","['Jessica Vamathevan', 'Dominic A. Clark', 'Paul Czodrowski', 'Ian Dunham', 'Edgardo A. Ferrán', 'George Lee', 'Bin Li', 'Anant Madabhushi', 'Parantu K. Shah', 'Michaela Spitzer', 'Shanrong Zhao']","['European Bioinformatics Institute', 'Bioinformatics Institute', 'European Bioinformatics Institute', 'TU Dortmund University', 'European Bioinformatics Institute', 'Open Targets', 'European Bioinformatics Institute', 'Bristol-Myers Squibb (United States)', 'Takeda (United States)', 'Louis Stokes Cleveland VA Medical Center', 'Case Western Reserve University', 'Ono Pharmaceutical (United States)', 'European Bioinformatics Institute', 'Open Targets', 'Pfizer (United States)']",,[],"['Computer science', 'Machine learning', 'Interpretability', 'Drug discovery', 'Artificial intelligence', 'Pipeline (software)', 'Identification (biology)', 'Context (archaeology)', 'Data science', 'Field (mathematics)', 'Drug development', 'Process (computing)', 'Data mining', 'Drug', 'Bioinformatics', 'Medicine']","['Computer science', 'Machine learning', 'Interpretability', 'Drug discovery', 'Artificial intelligence', 'Pipeline (software)', 'Identification (biology)', 'Context (archaeology)', 'Data science', 'Field (mathematics)', 'Drug development', 'Process (computing)', 'Data mining', 'Drug', 'Bioinformatics', 'Medicine', 'Psychiatry', 'Mathematics', 'Programming language', 'Pure mathematics', 'Biology', 'Operating system', 'Paleontology', 'Botany']",,18,6,463,477,Vamathevan 2019 Nature V18,European Bioinformatics Institute;Bioinformatics Institute;European Bioinformatics Institute;TU Dortmund University;European Bioinformatics Institute;Open Targets;European Bioinformatics Institute;Bristol-Myers Squibb (United States);Takeda (United States);Louis Stokes Cleveland VA Medical Center;Case Western Reserve University;Ono Pharmaceutical (United States);European Bioinformatics Institute;Open Targets;Pfizer (United States),European Bioinformatics Institute,European Bioinformatics Institute;Bioinformatics Institute;European Bioinformatics Institute;TU Dortmund University;European Bioinformatics Institute;Open Targets;European Bioinformatics Institute;Bristol-Myers Squibb (United States);Takeda (United States);Louis Stokes Cleveland VA Medical Center;Case Western Reserve University;Ono Pharmaceutical (United States);European Bioinformatics Institute;Open Targets;Pfizer (United States)
+OPENALEX,https://openalex.org/W2151591509,10.3389/fninf.2014.00014,24600388,Machine learning for neuroimaging with scikit-learn,Frontiers in Neuroinformatics,,,2014,article,en,2627,"['Abraham A.', 'Pedregosa F.', 'Eickenberg M.', 'Gervais P.', 'Mueller A.', 'Kossaifi J.', 'Gramfort A.', 'Thirion B.', 'Varoquaux G.']","['Alexandre Abraham', 'Fabian Pedregosa', 'Michael Eickenberg', 'Philippe Gervais', 'Andreas Mueller', 'Jean Kossaifi', 'Alexandre Gramfort', 'Bertrand Thirion', 'Gaël Varoquaux']","['Institut national de recherche en sciences et technologies du numérique', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'Centre Inria de Saclay', 'CEA Paris-Saclay', 'Institut national de recherche en sciences et technologies du numérique', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'Centre Inria de Saclay', 'CEA Paris-Saclay', 'Institut national de recherche en sciences et technologies du numérique', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'Centre Inria de Saclay', 'CEA Paris-Saclay', 'Institut national de recherche en sciences et technologies du numérique', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'Centre Inria de Saclay', 'CEA Paris-Saclay', 'University of Bonn', 'Imperial College London', 'Télécom Paris', 'Centre National de la Recherche Scientifique', 'Institut national de recherche en sciences et technologies du numérique', 'Institut Mines-Télécom', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'Centre Inria de Saclay', 'CEA Paris-Saclay', 'Laboratoire Traitement et Communication de l’Information', 'Institut national de recherche en sciences et technologies du numérique', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'Centre Inria de Saclay', 'CEA Paris-Saclay', 'Institut national de recherche en sciences et technologies du numérique', ""Commissariat à l'Énergie Atomique et aux Énergies Alternatives"", 'Centre Inria de Saclay', 'CEA Paris-Saclay']",,[],"['Neuroimaging', 'Computer science', 'Artificial intelligence', 'Unsupervised learning', 'Machine learning', 'Python (programming language)', 'Functional neuroimaging', 'Pattern recognition (psychology)', 'Psychology', 'Neuroscience']","['Neuroimaging', 'Computer science', 'Artificial intelligence', 'Unsupervised learning', 'Machine learning', 'Python (programming language)', 'Functional neuroimaging', 'Pattern recognition (psychology)', 'Psychology', 'Neuroscience', 'Operating system']",,8,,14,14,Abraham 2014 Frontiers V8,Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;University of Bonn;Imperial College London;Télécom Paris;Centre National de la Recherche Scientifique;Institut national de recherche en sciences et technologies du numérique;Institut Mines-Télécom;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;Laboratoire Traitement et Communication de l’Information;Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay,Institut national de recherche en sciences et technologies du numérique,Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;University of Bonn;Imperial College London;Télécom Paris;Centre National de la Recherche Scientifique;Institut national de recherche en sciences et technologies du numérique;Institut Mines-Télécom;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;Laboratoire Traitement et Communication de l’Information;Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay;Institut national de recherche en sciences et technologies du numérique;Commissariat à l'Énergie Atomique et aux Énergies Alternatives;Centre Inria de Saclay;CEA Paris-Saclay
+OPENALEX,https://openalex.org/W2975634117,10.1038/s41592-019-0582-9,31570887,ilastik: interactive machine learning for (bio)image analysis,Nature Methods,,,2019,review,en,3577,"['Berg S.', 'Kutra D.', 'Kroeger T.', 'Straehle C.', 'Kausler B.', 'Haubold C.', 'Schiegg M.', 'Aleš J.', 'Beier T.', 'Rudy M.', 'Eren K.', 'Cervantes J.', 'Xu B.', 'Beuttenmueller F.', 'Wolny A.', 'Zhang C.', 'Koethe U.', 'Hamprecht F.', 'Kreshuk A.']","['Stuart Berg', 'Dominik Kutra', 'Thorben Kroeger', 'Christoph Straehle', 'Bernhard X. Kausler', 'Carsten Haubold', 'Martin Schiegg', 'Janez Aleš', 'Thorsten Beier', 'Markus Rudy', 'Kemal Eren', 'Jaime I Cervantes', 'Buote Xu', 'Fynn Beuttenmueller', 'Adrian Wolny', 'Chong Zhang', 'Ullrich Koethe', 'Fred A. Hamprecht', 'Anna Kreshuk']","['Janelia Research Campus', 'Heidelberg University', 'European Molecular Biology Laboratory', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'European Molecular Biology Laboratory', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'Heidelberg University', 'European Molecular Biology Laboratory']",,[],"['Computer science', 'Workflow', 'Artificial intelligence', 'Segmentation', 'Machine learning', 'Classifier (UML)', 'Image segmentation', 'Computer vision', 'Pattern recognition (psychology)', 'Database']","['Computer science', 'Workflow', 'Artificial intelligence', 'Segmentation', 'Machine learning', 'Classifier (UML)', 'Image segmentation', 'Computer vision', 'Pattern recognition (psychology)', 'Database']",,16,12,1226,1232,Berg 2019 Nature V16,Janelia Research Campus;Heidelberg University;European Molecular Biology Laboratory;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;European Molecular Biology Laboratory;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;European Molecular Biology Laboratory,Janelia Research Campus,Janelia Research Campus;Heidelberg University;European Molecular Biology Laboratory;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;European Molecular Biology Laboratory;Heidelberg University;Heidelberg University;Heidelberg University;Heidelberg University;European Molecular Biology Laboratory
+OPENALEX,https://openalex.org/W2135194391,10.1023/a:1020281327116,,An Introduction to MCMC for Machine Learning,Machine Learning,,,2003,article,en,2407,"['Andrieu C.', 'Freitas N.', 'Douc R.', 'Jordan M.']","['Christophe Andrieu', 'Nando de Freitas', 'Randal Douc', 'Michael I. Jordan']","['University of Bristol', 'University of British Columbia', 'The University of Melbourne', 'University of California, Berkeley']",,[],"['Computer science', 'Markov chain Monte Carlo', 'Monte Carlo method', 'Probabilistic logic', 'Artificial intelligence', 'Machine learning', 'Bayesian probability', 'Mathematics', 'Statistics']","['Computer science', 'Markov chain Monte Carlo', 'Monte Carlo method', 'Probabilistic logic', 'Artificial intelligence', 'Machine learning', 'Bayesian probability', 'Mathematics', 'Statistics']",,50,1-2,5,43,Andrieu 2003 Machine V50,"University of Bristol;University of British Columbia;The University of Melbourne;University of California, Berkeley",University of Bristol,"University of Bristol;University of British Columbia;The University of Melbourne;University of California, Berkeley"
+OPENALEX,https://openalex.org/W2973119841,10.1146/annurev-fluid-010719-060214,,Machine Learning for Fluid Mechanics,Annual Review of Fluid Mechanics,,,2019,article,en,2556,"['Brunton S.', 'Noack B.', 'Koumoutsakos P.']","['Steven L. Brunton', 'Bernd R. Noack', 'Petros Koumoutsakos']","['University of Washington', 'Centre National de la Recherche Scientifique', 'Université Paris-Saclay', ""Laboratoire d'Informatique pour la Mécanique et les Sciences de l'Ingénieur"", 'Technische Universität Berlin', 'ETH Zurich']",,[],"['Fluid mechanics', 'Current (fluid)', 'Field (mathematics)', 'Perspective (graphical)', 'Fluid dynamics', 'Domain (mathematical analysis)']","['Fluid mechanics', 'Computer science', 'Current (fluid)', 'Field (mathematics)', 'Perspective (graphical)', 'Fluid dynamics', 'Artificial intelligence', 'Domain (mathematical analysis)', 'Machine learning', 'Domain knowledge', 'Flow (mathematics)', 'Statistical mechanics', 'Data science', 'Fluid motion']",,52,1,477,508,Brunton 2019 Annual V52,University of Washington;Centre National de la Recherche Scientifique;Université Paris-Saclay;Laboratoire d'Informatique pour la Mécanique et les Sciences de l'Ingénieur;Technische Universität Berlin;ETH Zurich,University of Washington,University of Washington;Centre National de la Recherche Scientifique;Université Paris-Saclay;Laboratoire d'Informatique pour la Mécanique et les Sciences de l'Ingénieur;Technische Universität Berlin;ETH Zurich
+OPENALEX,https://openalex.org/W2111547563,10.1016/j.csbj.2014.11.005,25750696,Machine learning applications in cancer prognosis and prediction,Computational and Structural Biotechnology Journal,,,2014,review,en,3275,"['Κούρου Κ.', 'Exarchos T.', 'Exarchos K.', 'Karamouzis M.', 'Fotiadis D.']","['Κωνσταντίνα Κούρου', 'Themis P. Exarchos', 'Konstantinos Exarchos', 'Michalis V. Karamouzis', 'Dimitrios I. Fotiadis']","['University of Ioannina', 'University of Ioannina', 'FORTH Institute of Molecular Biology and Biotechnology', 'University of Ioannina', 'National and Kapodistrian University of Athens', 'University of Ioannina', 'FORTH Institute of Molecular Biology and Biotechnology']",,[],"['Machine learning', 'Artificial intelligence', 'Computer science', 'Support vector machine', 'Cancer', 'Artificial neural network', 'Bayesian network', 'Clinical Practice', 'Variety (cybernetics)', 'Field (mathematics)', 'Predictive modelling', 'Medicine', 'Mathematics']","['Machine learning', 'Artificial intelligence', 'Computer science', 'Support vector machine', 'Cancer', 'Artificial neural network', 'Bayesian network', 'Clinical Practice', 'Variety (cybernetics)', 'Field (mathematics)', 'Predictive modelling', 'Medicine', 'Mathematics', 'Pure mathematics', 'Internal medicine', 'Family medicine']",,13,,8,17,Κούρου 2014 Computational V13,University of Ioannina;University of Ioannina;FORTH Institute of Molecular Biology and Biotechnology;University of Ioannina;National and Kapodistrian University of Athens;University of Ioannina;FORTH Institute of Molecular Biology and Biotechnology,University of Ioannina,University of Ioannina;University of Ioannina;FORTH Institute of Molecular Biology and Biotechnology;University of Ioannina;National and Kapodistrian University of Athens;University of Ioannina;FORTH Institute of Molecular Biology and Biotechnology
+OPENALEX,https://openalex.org/W2525984666,10.1056/nejmp1606181,,"Predicting the Future — Big Data, Machine Learning, and Clinical Medicine",New England Journal of Medicine,,,2016,article,en,3451,"['Obermeyer Z.', 'Emanuel E.']","['Ziad Obermeyer', 'Ezekiel Emanuel']","['Harvard University', 'University of Pennsylvania']",,[],"['Medicine', 'Machine learning', 'Artificial intelligence', 'Big data', 'Precision medicine', 'Data science', 'Scale-invariant feature transform', 'MEDLINE', 'Medical physics', 'Computer science', 'Pathology', 'Data mining', 'Feature extraction']","['Medicine', 'Machine learning', 'Artificial intelligence', 'Big data', 'Precision medicine', 'Data science', 'Scale-invariant feature transform', 'MEDLINE', 'Medical physics', 'Computer science', 'Pathology', 'Data mining', 'Feature extraction', 'Law', 'Political science']",,375,13,1216,1219,Obermeyer 2016 New V375,Harvard University;University of Pennsylvania,Harvard University,Harvard University;University of Pennsylvania
+OPENALEX,https://openalex.org/W2923537029,10.1103/revmodphys.91.045002,,Machine learning and the physical sciences,Reviews of Modern Physics,,,2019,article,en,2413,"['Carleo G.', 'Cirac J.', 'Cranmer K.', 'Daudet L.', 'Schuld M.', 'Tishby N.', 'Vogt-Maranto L.', 'Zdeborová L.']","['Giuseppe Carleo', 'J. I. Cirac', 'K. Cranmer', 'Laurent Daudet', 'Maria Schuld', 'Naftali Tishby', 'Leslie Vogt-Maranto', 'Lenka Zdeborová']","['Flatiron Health (United States)', 'Flatiron Health (United States)', 'Flatiron Health (United States)', 'Flatiron Health (United States)', 'Flatiron Health (United States)', 'Flatiron Health (United States)', 'Flatiron Health (United States)', 'Flatiron Health (United States)']",,[],"['Physics', 'Field (mathematics)', 'Column (typography)', 'Engineering physics', 'Library science', 'Data science', 'Engineering ethics', 'Mechanical engineering', 'Computer science', 'Engineering', 'Connection (principal bundle)']","['Physics', 'Field (mathematics)', 'Column (typography)', 'Engineering physics', 'Library science', 'Data science', 'Engineering ethics', 'Mechanical engineering', 'Computer science', 'Engineering', 'Connection (principal bundle)', 'Pure mathematics', 'Mathematics']",,91,4,,,Carleo 2019 Reviews V91,Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States),Flatiron Health (United States),Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States);Flatiron Health (United States)
+OPENALEX,https://openalex.org/W1541288193,10.1023/a:1022602019183,,Genetic Algorithms and Machine Learning,Machine Learning,,,1988,article,en,3023,"['Goldberg D.', 'Holland J.']","['David E. Goldberg', 'John H. Holland']","['University of Alabama', 'University of Michigan–Ann Arbor']",,[],"['Mathematics', 'Artificial intelligence', 'Computer science']","['Mathematics', 'Artificial intelligence', 'Computer science']",,3,2-3,95,99,Goldberg 1988 Machine V3,University of Alabama;University of Michigan–Ann Arbor,University of Alabama,University of Alabama;University of Michigan–Ann Arbor
+OPENALEX,https://openalex.org/W2603766943,10.1145/3052973.3053009,,Practical Black-Box Attacks against Machine Learning,,,,2017,article,en,3465,"['Papernot N.', 'McDaniel P.', 'Goodfellow I.', 'Jha S.', 'Celik Z.', 'Swami A.']","['Nicolas Papernot', 'Patrick McDaniel', 'Ian Goodfellow', 'Somesh Jha', 'Z. Berkay Celik', 'Ananthram Swami']","['Pennsylvania State University', 'Pennsylvania State University', 'OpenAI (United States)', 'University of Wisconsin–Madison', 'Pennsylvania State University', 'DEVCOM Army Research Laboratory']",,[],"['Adversarial system', 'Computer science', 'Adversary', 'Black box', 'Malware', 'Deep neural networks', 'Artificial intelligence', 'Deep learning', 'Machine learning', 'Artificial neural network', 'Adversarial machine learning', 'Threat model', 'Computer security']","['Adversarial system', 'Computer science', 'Adversary', 'Black box', 'Malware', 'Deep neural networks', 'Artificial intelligence', 'Deep learning', 'Machine learning', 'Artificial neural network', 'Adversarial machine learning', 'Threat model', 'Computer security']",,,,506,519,Papernot 2017 UNKNOWNJ VV0,Pennsylvania State University;Pennsylvania State University;OpenAI (United States);University of Wisconsin–Madison;Pennsylvania State University;DEVCOM Army Research Laboratory,Pennsylvania State University,Pennsylvania State University;Pennsylvania State University;OpenAI (United States);University of Wisconsin–Madison;Pennsylvania State University;DEVCOM Army Research Laboratory
+OPENALEX,https://openalex.org/W3200707343,10.1038/s41580-021-00407-0,34518686,A guide to machine learning for biologists,Nature Reviews Molecular Cell Biology,,,2021,review,en,2034,"['Greener J.', 'Kandathil S.', 'Moffat L.', 'Jones D.']","['Joe G. Greener', 'Shaun M. Kandathil', 'Lewis Moffat', 'David T. Jones']","['University College London', 'University College London', 'University College London', 'The London College', 'University College London']",,[],"['Machine learning', 'Artificial intelligence', 'Computer science', 'Biological data', 'Deep learning', 'Artificial neural network', 'Bioinformatics', 'Biology']","['Machine learning', 'Artificial intelligence', 'Computer science', 'Biological data', 'Deep learning', 'Artificial neural network', 'Bioinformatics', 'Biology']",,23,1,40,55,Greener 2021 Nature V23,University College London;University College London;University College London;The London College;University College London,University College London,University College London;University College London;University College London;The London College;University College London
+OPENALEX,https://openalex.org/W2914584698,,,Proceedings of the 23rd international conference on Machine learning,,,,2006,article,en,2592,"['Cohen W.', 'Moore A.']","['William W. Cohen', 'Andrew Moore']",[],,[],"['Presentation (obstetrics)', 'Artificial intelligence', 'Library science', 'Computer science', 'Medical education', 'Medicine']","['Presentation (obstetrics)', 'Artificial intelligence', 'Library science', 'Computer science', 'Medical education', 'Medicine', 'Radiology']",,,,,,Cohen 2006 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W3116286104,10.3390/e23010018,33375658,Explainable AI: A Review of Machine Learning Interpretability Methods,Entropy,,,2020,review,en,2703,"['Linardatos P.', 'Papastefanopoulos V.', 'Kotsiantis S.']","['Pantelis Linardatos', 'Vasilis Papastefanopoulos', 'Sotiris Kotsiantis']","['University of Patras', 'University of Patras', 'University of Patras']",,[],"['Interpretability', 'Artificial intelligence', 'Computer science', 'Machine learning', 'Ambiguity', 'Field (mathematics)', 'Implementation', 'Black box', 'Management science', 'Data science', 'Software engineering', 'Engineering']","['Interpretability', 'Artificial intelligence', 'Computer science', 'Machine learning', 'Ambiguity', 'Field (mathematics)', 'Implementation', 'Black box', 'Management science', 'Data science', 'Software engineering', 'Engineering', 'Mathematics', 'Pure mathematics', 'Programming language']",,23,1,18,18,Linardatos 2020 Entropy V23,University of Patras;University of Patras;University of Patras,University of Patras,University of Patras;University of Patras;University of Patras
+OPENALEX,https://openalex.org/W2142334564,10.2307/1269742,,"Machine Learning, Neural and Statistical Classification",Technometrics,,,1995,article,en,2191,"['Fulkerson B.', 'Michie D.', 'Spiegelhalter D.', 'Taylor C.']","['Bill Fulkerson', 'D. Michie', 'D. J. Spiegelhalter', 'C. C. W. Taylor']","['John Deere (Germany)', 'University of Cambridge']",,[],"['Machine learning', 'Artificial intelligence', 'Computer science', 'Artificial neural network', 'Statistical learning']","['Machine learning', 'Artificial intelligence', 'Computer science', 'Artificial neural network', 'Statistical learning']",,37,4,459,459,Fulkerson 1995 Technometrics V37,John Deere (Germany);University of Cambridge,John Deere (Germany),John Deere (Germany);University of Cambridge
+OPENALEX,https://openalex.org/W2962727772,,,Automatic differentiation in machine learning: a survey,Maynooth University ePrints and eTheses Archive (Maynooth University),,,2015,article,en,2097,"['Baydin A.', 'Pearlmutter B.', 'Radul A.', 'Siskind J.']","['Atılım Güneş Baydin', 'Barak A. Pearlmutter', 'Alexey Radul', 'Jeffrey Mark Siskind']","['University of Oxford', 'Science Oxford', 'National University of Ireland, Maynooth', 'Massachusetts Institute of Technology', 'Purdue University West Lafayette']",,[],"['Computer science', 'Artificial intelligence', 'Relevance (law)', 'Machine learning', 'Automatic differentiation', 'Differentiable function', 'CLARITY', 'Toolbox', 'Field (mathematics)', 'Algorithmic learning theory', 'Active learning (machine learning)', 'Theoretical computer science', 'Algorithm', 'Programming language', 'Mathematics']","['Computer science', 'Artificial intelligence', 'Relevance (law)', 'Machine learning', 'Automatic differentiation', 'Differentiable function', 'CLARITY', 'Toolbox', 'Field (mathematics)', 'Algorithmic learning theory', 'Active learning (machine learning)', 'Theoretical computer science', 'Algorithm', 'Programming language', 'Mathematics', 'Mathematical analysis', 'Biochemistry', 'Law', 'Computation', 'Pure mathematics', 'Political science', 'Chemistry']",,,,,,Baydin 2015 Maynooth VV0,"University of Oxford;Science Oxford;National University of Ireland, Maynooth;Massachusetts Institute of Technology;Purdue University West Lafayette",University of Oxford,"University of Oxford;Science Oxford;National University of Ireland, Maynooth;Massachusetts Institute of Technology;Purdue University West Lafayette"
+OPENALEX,https://openalex.org/W2594639291,10.5860/choice.44-5091,,Pattern recognition and machine learning,Choice Reviews Online,,,2007,article,en,2688,[],[],[],,[],"['Artificial intelligence', 'Computer science', 'Pattern recognition (psychology)', 'Psychology']","['Artificial intelligence', 'Computer science', 'Pattern recognition (psychology)', 'Psychology']",,44,09,44,5091,UNKNOWN 2007 Choice V44,,,
+OPENALEX,https://openalex.org/W2751318774,10.1142/9789811201967_0001,,Introduction to Machine Learning,Series in machine perception and artificial intelligence,,,2019,book-chapter,en,1659,[],[],[],,[],"['Computer science', 'Artificial intelligence']","['Computer science', 'Artificial intelligence']",,,,1,22,UNKNOWN 2019 Series VV0,,,
+OPENALEX,https://openalex.org/W1505191356,10.1038/nrg3920,25948244,Machine learning applications in genetics and genomics,Nature Reviews Genetics,,,2015,review,en,2010,"['Libbrecht M.', 'Noble W.']","['Maxwell W. Libbrecht', 'William Stafford Noble']","['University of Washington', 'University of Washington']",,[],"['Machine learning', 'Artificial intelligence', 'Computer science', 'Genomics', 'Unsupervised learning', 'Selection (genetic algorithm)', 'Discriminative model', 'Epigenomics', 'Feature selection', 'Genome', 'Biology']","['Machine learning', 'Artificial intelligence', 'Computer science', 'Genomics', 'Unsupervised learning', 'Selection (genetic algorithm)', 'Discriminative model', 'Epigenomics', 'Feature selection', 'Genome', 'Biology', 'Biochemistry', 'Gene expression', 'Gene', 'DNA methylation']",,16,6,321,332,Libbrecht 2015 Nature V16,University of Washington;University of Washington,University of Washington,University of Washington;University of Washington
+OPENALEX,https://openalex.org/W3145506661,10.1007/978-3-030-10546-4_1,,Introduction to Machine Learning,Springer briefs in electrical and computer engineering,,,2019,book-chapter,en,1620,"['Yu F.', 'He Y.']","['F. Richard Yu', 'Ying He']","['Carleton University', 'Carleton University']",,[],"['Computer science', 'Artificial intelligence']","['Computer science', 'Artificial intelligence']",,,,1,13,Yu 2019 Springer VV0,Carleton University;Carleton University,Carleton University,Carleton University;Carleton University
+OPENALEX,https://openalex.org/W4205539948,10.1093/rfs/hhaa009,,Empirical Asset Pricing via Machine Learning,Review of Financial Studies,,,2020,article,en,2188,"['Gu S.', 'Kelly B.', 'Xiu D.']","['Shihao Gu', 'Bryan Kelly', 'Dacheng Xiu']","['University of Chicago', 'Capital University', 'Yale University', 'University of Chicago']",,[],"['Capital asset pricing model', 'Machine learning', 'Computer science', 'Artificial intelligence', 'Artificial neural network', 'Volatility (finance)', 'Market liquidity', 'Econometrics', 'Asset (computer security)', 'TRACE (psycholinguistics)', 'Set (abstract data type)', 'Economics', 'Finance']","['Capital asset pricing model', 'Machine learning', 'Computer science', 'Artificial intelligence', 'Artificial neural network', 'Volatility (finance)', 'Market liquidity', 'Econometrics', 'Asset (computer security)', 'TRACE (psycholinguistics)', 'Set (abstract data type)', 'Economics', 'Finance', 'Linguistics', 'Programming language', 'Philosophy', 'Computer security']",,33,5,2223,2273,Gu 2020 Review V33,University of Chicago;Capital University;Yale University;University of Chicago,University of Chicago,University of Chicago;Capital University;Yale University;University of Chicago
+OPENALEX,https://openalex.org/W1993220166,10.1145/1007730.1007735,,A study of the behavior of several methods for balancing machine learning training data,ACM SIGKDD Explorations Newsletter,,,2004,article,en,4104,"['Batista G.', 'Prati R.', 'Monard M.']","['Gustavo E. A. P. A. Batista', 'Ronaldo C. Prati', 'Maria Carolina Monard']","['Brazilian Society of Computational and Applied Mathematics', 'Brazilian Society of Computational and Applied Mathematics', 'Brazilian Society of Computational and Applied Mathematics']",,[],"['Computer science', 'Class (philosophy)', 'Machine learning', 'Artificial intelligence', 'Sampling (signal processing)', 'Simple random sample', 'Event (particle physics)', 'Data mining', 'Simple (philosophy)']","['Computer science', 'Class (philosophy)', 'Machine learning', 'Artificial intelligence', 'Sampling (signal processing)', 'Simple random sample', 'Event (particle physics)', 'Data mining', 'Simple (philosophy)', 'Population', 'Filter (signal processing)', 'Computer vision', 'Demography', 'Sociology', 'Philosophy', 'Epistemology', 'Physics', 'Quantum mechanics']",,6,1,20,29,Batista 2004 ACM V6,Brazilian Society of Computational and Applied Mathematics;Brazilian Society of Computational and Applied Mathematics;Brazilian Society of Computational and Applied Mathematics,Brazilian Society of Computational and Applied Mathematics,Brazilian Society of Computational and Applied Mathematics;Brazilian Society of Computational and Applied Mathematics;Brazilian Society of Computational and Applied Mathematics
+OPENALEX,https://openalex.org/W2767079719,10.1145/3133956.3133982,,Practical Secure Aggregation for Privacy-Preserving Machine Learning,,,,2017,article,en,3394,"['Bonawitz K.', 'Ivanov V.', 'Kreuter B.', 'Marcedone A.', 'McMahan H.', 'Patel S.', 'Ramage D.', 'Segal A.', 'Seth K.']","['Keith Bonawitz', 'Vladimir Ivanov', 'Ben Kreuter', 'Antonio Marcedone', 'H. Brendan McMahan', 'Sarvar Patel', 'Daniel Ramage', 'Aaron Segal', 'Karn Seth']","['Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Cornell University', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)', 'Google (United States)']",,[],"['Computer science', 'Overhead (engineering)', 'Protocol (science)', 'Universal composability', 'Adversary', 'Computer network', 'Aggregate (composite)', 'Cryptographic protocol', 'Distributed computing', 'Theoretical computer science', 'Cryptography', 'Computer security', 'Operating system']","['Computer science', 'Overhead (engineering)', 'Protocol (science)', 'Universal composability', 'Adversary', 'Computer network', 'Aggregate (composite)', 'Cryptographic protocol', 'Distributed computing', 'Theoretical computer science', 'Cryptography', 'Computer security', 'Operating system', 'Composite material', 'Medicine', 'Alternative medicine', 'Materials science', 'Pathology']",,,,1175,1191,Bonawitz 2017 UNKNOWNJ VV0,Google (United States);Google (United States);Google (United States);Google (United States);Cornell University;Google (United States);Google (United States);Google (United States);Google (United States);Google (United States),Google (United States),Google (United States);Google (United States);Google (United States);Google (United States);Cornell University;Google (United States);Google (United States);Google (United States);Google (United States);Google (United States)
+OPENALEX,https://openalex.org/W3122548859,10.1177/2053951715622512,,How the machine ‘thinks’: Understanding opacity in machine learning algorithms,Big Data & Society,,,2016,article,en,2445,['Burrell J.'],['Jenna Burrell'],"['University of California, Berkeley']",,[],"['Machine learning', 'Computer science', 'Artificial intelligence', 'Credit card fraud', 'Algorithm', 'Audit', 'Opacity', 'Credit card', 'Economics', 'World Wide Web']","['Machine learning', 'Computer science', 'Artificial intelligence', 'Credit card fraud', 'Algorithm', 'Audit', 'Opacity', 'Credit card', 'Economics', 'World Wide Web', 'Management', 'Physics', 'Optics', 'Payment']",,3,1,,,Burrell 2016 Big V3,"University of California, Berkeley",Berkeley,"University of California, Berkeley"
+OPENALEX,https://openalex.org/W2610886376,10.1257/jep.31.2.87,,Machine Learning: An Applied Econometric Approach,The Journal of Economic Perspectives,,,2017,article,en,1863,"['Mullainathan S.', 'Spiess J.']","['Sendhil Mullainathan', 'Jann Spiess']","['Harvard University', 'Harvard University Press']",,[],"['Toolbox', 'Python (programming language)', 'Machine learning', 'Computer science', 'Artificial intelligence', 'Face (sociological concept)', 'Empirical research', 'Mathematics']","['Toolbox', 'Python (programming language)', 'Machine learning', 'Computer science', 'Artificial intelligence', 'Face (sociological concept)', 'Empirical research', 'Mathematics', 'Social science', 'Statistics', 'Programming language', 'Operating system', 'Sociology']",,31,2,87,106,Mullainathan 2017 The V31,Harvard University;Harvard University Press,Harvard University,Harvard University;Harvard University Press
+OPENALEX,https://openalex.org/W1596324102,,,Machine Learning: An Artificial Intelligence Approach,,,,2013,book,en,2639,"['Michalski R.', 'Carbonell J.', 'Mitchell T.']","['Ryszard S. Michalski', 'Jaime G. Carbonell', 'Thomas M. Mitchell']",[],,[],"['Computer science', 'Artificial intelligence', 'Perspective (graphical)', 'Heuristics', 'Machine learning', 'Hyper-heuristic', 'Data science', 'Cognitive science', 'Robot learning', 'Psychology']","['Computer science', 'Artificial intelligence', 'Perspective (graphical)', 'Heuristics', 'Machine learning', 'Hyper-heuristic', 'Data science', 'Cognitive science', 'Robot learning', 'Psychology', 'Robot', 'Mobile robot', 'Operating system']",,,,,,Michalski 2013 UNKNOWNJ VV0,,,
+OPENALEX,https://openalex.org/W1494192115,10.1038/nature14541,26017444,Probabilistic machine learning and artificial intelligence,Nature,,,2015,review,en,1965,['Ghahramani Z.'],['Zoubin Ghahramani'],['University of Cambridge'],,[],"['Artificial intelligence', 'Probabilistic logic', 'Computer science', 'Machine learning', 'Field (mathematics)', 'Principal (computer security)', 'Bayesian probability', 'Statistical model', 'Cognitive robotics', 'Robot']","['Artificial intelligence', 'Probabilistic logic', 'Computer science', 'Machine learning', 'Field (mathematics)', 'Principal (computer security)', 'Bayesian probability', 'Statistical model', 'Cognitive robotics', 'Robot', 'Operating system', 'Pure mathematics', 'Mathematics']",,521,7553,452,459,Ghahramani 2015 Nature V521,University of Cambridge,University of Cambridge,University of Cambridge
+OPENALEX,https://openalex.org/W2791315675,10.1016/j.neucom.2017.11.077,,Feature selection in machine learning: A new perspective,Neurocomputing,,,2018,article,en,2045,"['Cai J.', 'Luo J.', 'Wang S.', 'Yang S.']","['Jie Cai', 'Jiawei Luo', 'Shulin Wang', 'Sheng Yang']","['Hunan University', 'Hunan University', 'Hunan University', 'Hunan University']",,[],"['Feature selection', 'Machine learning', 'Computer science', 'Artificial intelligence', 'Cluster analysis', 'Feature (linguistics)', 'Perspective (graphical)', 'Selection (genetic algorithm)', 'Unsupervised learning', 'Supervised learning', 'Feature learning', 'Data mining', 'Artificial neural network']","['Feature selection', 'Machine learning', 'Computer science', 'Artificial intelligence', 'Cluster analysis', 'Feature (linguistics)', 'Perspective (graphical)', 'Selection (genetic algorithm)', 'Unsupervised learning', 'Supervised learning', 'Feature learning', 'Data mining', 'Artificial neural network', 'Linguistics', 'Philosophy']",,300,,70,79,Cai 2018 Neurocomputing V300,Hunan University;Hunan University;Hunan University;Hunan University,Hunan University,Hunan University;Hunan University;Hunan University;Hunan University
+OPENALEX,https://openalex.org/W2968923792,10.1038/s41524-019-0221-0,,Recent advances and applications of machine learning in solid-state materials science,npj Computational Materials,,,2019,article,en,2366,"['Schmidt J.', 'Marques M.', 'Botti S.', 'Marques M.']","['Jonathan Schmidt', 'Mário R. G. Marques', 'Silvana Botti', 'Miguel A. L. Marques']","['Martin Luther University Halle-Wittenberg', 'Martin Luther University Halle-Wittenberg', 'Friedrich Schiller University Jena', 'Martin Luther University Halle-Wittenberg']",,[],"['Interpretability', 'Toolbox', 'Machine learning', 'Artificial intelligence', 'Computer science', 'Process (computing)', 'Property (philosophy)', 'Point (geometry)', 'Mathematics']","['Interpretability', 'Toolbox', 'Machine learning', 'Artificial intelligence', 'Computer science', 'Process (computing)', 'Property (philosophy)', 'Point (geometry)', 'Mathematics', 'Philosophy', 'Geometry', 'Operating system', 'Epistemology', 'Programming language']",,5,1,,,Schmidt 2019 npj V5,Martin Luther University Halle-Wittenberg;Martin Luther University Halle-Wittenberg;Friedrich Schiller University Jena;Martin Luther University Halle-Wittenberg,Martin Luther University Halle-Wittenberg,Martin Luther University Halle-Wittenberg;Martin Luther University Halle-Wittenberg;Friedrich Schiller University Jena;Martin Luther University Halle-Wittenberg
+OPENALEX,https://openalex.org/W164706946,,,Gaussian Processes for Machine Learning (Adaptive Computation and Machine Learning),The MIT Press eBooks,,,2005,book,en,1865,"['Rasmussen C.', 'Williams C.']","['Carl Edward Rasmussen', 'Christopher K. I. Williams']",[],,[],"['Computer science', 'Computation', 'Artificial intelligence', 'Machine learning', 'Computational learning theory', 'Gaussian process', 'Gaussian', 'Active learning (machine learning)', 'Algorithm', 'Physics']","['Computer science', 'Computation', 'Artificial intelligence', 'Machine learning', 'Computational learning theory', 'Gaussian process', 'Gaussian', 'Active learning (machine learning)', 'Algorithm', 'Physics', 'Quantum mechanics']",,,,,,Rasmussen 2005 The VV0,,,
+OPENALEX,https://openalex.org/W2910705748,10.1073/pnas.1900654116,31619572,"Definitions, methods, and applications in interpretable machine learning",Proceedings of the National Academy of Sciences,,,2019,article,en,2050,"['Murdoch W.', 'Singh C.', 'Kumbier K.', 'Abbasi-Asl R.', 'Yu B.']","['William J. Murdoch', 'Chandan Singh', 'Karl Kumbier', 'Reza Abbasi-Asl', 'Bin Yu']","['University of California, Berkeley', 'University of California, Berkeley', 'University of California, Berkeley', 'Allen Institute for Brain Science', 'University of California, San Francisco', 'Allen Institute', 'University of California, Berkeley', 'University of California, Berkeley']",,[],"['Interpretability', 'Computer science', 'Artificial intelligence', 'Categorization', 'Machine learning', 'Context (archaeology)', 'Interpretation (philosophy)', 'Modularity (biology)', 'Vocabulary', 'Data science', 'Focus (optics)']","['Interpretability', 'Computer science', 'Artificial intelligence', 'Categorization', 'Machine learning', 'Context (archaeology)', 'Interpretation (philosophy)', 'Modularity (biology)', 'Vocabulary', 'Data science', 'Focus (optics)', 'Paleontology', 'Optics', 'Genetics', 'Programming language', 'Linguistics', 'Philosophy', 'Biology', 'Physics']",,116,44,22071,22080,Murdoch 2019 Proceedings V116,"University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;Allen Institute for Brain Science;University of California, San Francisco;Allen Institute;University of California, Berkeley;University of California, Berkeley",Berkeley,"University of California, Berkeley;University of California, Berkeley;University of California, Berkeley;Allen Institute for Brain Science;University of California, San Francisco;Allen Institute;University of California, Berkeley;University of California, Berkeley"
+OPENALEX,https://openalex.org/W2342408547,10.1109/comst.2015.2494502,,A Survey of Data Mining and Machine Learning Methods for Cyber Security Intrusion Detection,IEEE Communications Surveys & Tutorials,,,2015,article,en,3024,"['Buczak A.', 'Guven E.']","['Anna L. Buczak', 'Erhan Guven']","['Johns Hopkins University Applied Physics Laboratory', 'Johns Hopkins University Applied Physics Laboratory']",,[],"['Computer science', 'Intrusion detection system', 'Data mining', 'Relevance (law)', 'Analytics', 'Intrusion', 'Data science', 'Machine learning']","['Computer science', 'Intrusion detection system', 'Data mining', 'Relevance (law)', 'Analytics', 'Intrusion', 'Data science', 'Machine learning', 'Political science', 'Geology', 'Law', 'Geochemistry']",,18,2,1153,1176,Buczak 2015 IEEE V18,Johns Hopkins University Applied Physics Laboratory;Johns Hopkins University Applied Physics Laboratory,Johns Hopkins University Applied Physics Laboratory,Johns Hopkins University Applied Physics Laboratory;Johns Hopkins University Applied Physics Laboratory
+OPENALEX,https://openalex.org/W4213308398,10.1007/978-3-030-05318-5,,Automated Machine Learning,The Springer series on challenges in machine learning,,,2019,book,en,1379,"['Hutter F.', 'Kotthoff L.', 'Vanschoren J.']","['Frank Hutter', 'Lars Kotthoff', 'Joaquin Vanschoren']","['University of Freiburg', 'University of Wyoming', 'Eindhoven University of Technology']",,[],"['Computer science', 'Artificial intelligence', 'Machine learning']","['Computer science', 'Artificial intelligence', 'Machine learning']",,,,,,Hutter 2019 The VV0,University of Freiburg;University of Wyoming;Eindhoven University of Technology,University of Freiburg,University of Freiburg;University of Wyoming;Eindhoven University of Technology
+OPENALEX,https://openalex.org/W2168029744,10.1214/009053607000000677,,Kernel methods in machine learning,The Annals of Statistics,,,2008,article,en,1588,"['Hofmann T.', 'Schölkopf B.', 'Smola A.']","['Thomas Hofmann', 'Bernhard Schölkopf', 'Alexander J. Smola']","['Data61', 'Data61', 'Max Planck Institute for Biological Cybernetics']",,[],"['Reproducing kernel Hilbert space', 'Kernel (algebra)', 'Kernel method', 'Hilbert space', 'Binary classification', 'Range (aeronautics)', 'Kernel embedding of distributions', 'Representer theorem', 'Pattern recognition (psychology)', 'Radial basis function kernel']","['Reproducing kernel Hilbert space', 'Artificial intelligence', 'Machine learning', 'Kernel (algebra)', 'Kernel method', 'Computer science', 'Hilbert space', 'Mathematics', 'Binary classification', 'Range (aeronautics)', 'Kernel embedding of distributions', 'Representer theorem', 'Pattern recognition (psychology)', 'Radial basis function kernel', 'Tree kernel', 'Semi-supervised learning', 'Function (biology)', 'Structured prediction', 'Polynomial kernel', 'Online machine learning', 'Score', 'Support vector machine', 'Algorithm', 'Active learning (machine learning)', 'Nonlinear system', 'Binary number', 'Training set', 'Cover (algebra)', 'Ranging', 'Supervised learning', 'Data point', 'Space (punctuation)']",,36,3,,,Hofmann 2008 The V36,Data61;Data61;Max Planck Institute for Biological Cybernetics,Data61,Data61;Data61;Max Planck Institute for Biological Cybernetics
+OPENALEX,https://openalex.org/W2951278869,10.48550/arxiv.cs/0205070,,Thumbs up? Sentiment Classification using Machine Learning Techniques,ArXiv.org,,,2002,preprint,en,2213,"['Pang B.', 'Lee L.', 'Vaithyanathan S.']","['Bo Pang', 'Lillian Lee', 'Shivakumar Vaithyanathan']","['Cornell University', 'Cornell University', 'IBM Research - Almaden']",,[],"['Naive Bayes classifier', 'Computer science', 'Categorization', 'Artificial intelligence', 'Sentiment analysis', 'Support vector machine', 'Machine learning', 'Principle of maximum entropy', 'Natural language processing']","['Naive Bayes classifier', 'Computer science', 'Categorization', 'Artificial intelligence', 'Sentiment analysis', 'Support vector machine', 'Machine learning', 'Principle of maximum entropy', 'Natural language processing']",,,,,,Pang 2002 ArXiv.org VV0,Cornell University;Cornell University;IBM Research - Almaden,Cornell University,Cornell University;Cornell University;IBM Research - Almaden
+OPENALEX,https://openalex.org/W2982720039,,,UCI Repository of Machine Learning Databases,Medical Entomology and Zoology,,,1996,article,en,2342,['Merz C.'],['Christopher J. Merz'],[],,[],"['Database', 'Computer science', 'Artificial intelligence']","['Database', 'Computer science', 'Artificial intelligence']",,,,,,Merz 1996 Medical VV0,,,
+OPENALEX,https://openalex.org/W2104489082,10.1103/physrevlett.108.058301,22400967,Fast and Accurate Modeling of Molecular Atomization Energies with Machine Learning,Physical Review Letters,,,2012,article,en,2377,"['Rupp M.', 'Tkatchenko A.', 'Müller K.', 'Lilienfeld O.']","['Matthias Rupp', 'Alexandre Tkatchenko', 'Klaus‐Robert Müller', 'O. Anatole von Lilienfeld']","['Technische Universität Berlin', 'University of California, Los Angeles', 'University of California, Los Angeles', 'Fritz Haber Institute of the Max Planck Society', 'Technische Universität Berlin', 'University of California, Los Angeles', 'University of California, Los Angeles', 'Argonne National Laboratory']",,[],"['Computer science', 'Statistical physics', 'Physics']","['Computer science', 'Statistical physics', 'Physics']",,108,5,058301,058301,Rupp 2012 Physical V108,"Technische Universität Berlin;University of California, Los Angeles;University of California, Los Angeles;Fritz Haber Institute of the Max Planck Society;Technische Universität Berlin;University of California, Los Angeles;University of California, Los Angeles;Argonne National Laboratory",Technische Universität Berlin,"Technische Universität Berlin;University of California, Los Angeles;University of California, Los Angeles;Fritz Haber Institute of the Max Planck Society;Technische Universität Berlin;University of California, Los Angeles;University of California, Los Angeles;Argonne National Laboratory"
+OPENALEX,https://openalex.org/W2998506103,10.1016/j.ymssp.2019.106587,,Applications of machine learning to machine fault diagnosis: A review and roadmap,Mechanical Systems and Signal Processing,,,2020,review,en,2653,"['Lei Y.', 'Yang B.', 'Jiang X.', 'Jia F.', 'Li N.', 'Nandi A.']","['Yaguo Lei', 'Bin Yang', 'Xinwei Jiang', 'Feng Jia', 'Naipeng Li', 'Asoke K. Nandi']","[""Xi'an Jiaotong University"", ""Xi'an Jiaotong University"", ""Xi'an Jiaotong University"", ""Xi'an Jiaotong University"", ""Xi'an Jiaotong University"", 'Brunel University of London']",,[],"['Artificial intelligence', 'Machine learning', 'Computer science', 'Bridge (graph theory)', 'Engineering']","['Artificial intelligence', 'Machine learning', 'Computer science', 'Bridge (graph theory)', 'Engineering', 'Medicine', 'Internal medicine']",,138,,106587,106587,Lei 2020 Mechanical V138,Xi'an Jiaotong University;Xi'an Jiaotong University;Xi'an Jiaotong University;Xi'an Jiaotong University;Xi'an Jiaotong University;Brunel University of London,Xi'an Jiaotong University,Xi'an Jiaotong University;Xi'an Jiaotong University;Xi'an Jiaotong University;Xi'an Jiaotong University;Xi'an Jiaotong University;Brunel University of London
+OPENALEX,https://openalex.org/W2792919287,10.1038/nmeth.4642,30100822,Statistics versus machine learning,Nature Methods,,,2018,article,en,1478,"['Bzdok D.', 'Altman N.', 'Krzywinski M.']","['Danilo Bzdok', 'Naomi Altman', 'Martin Krzywinski']","['RWTH Aachen University', 'Pennsylvania State University', ""Canada's Michael Smith Genome Sciences Centre""]",,[],"['Computer science', 'Statistics', 'Computational biology', 'Artificial intelligence', 'Machine learning', 'Biology', 'Mathematics']","['Computer science', 'Statistics', 'Computational biology', 'Artificial intelligence', 'Machine learning', 'Biology', 'Mathematics']",,15,4,233,234,Bzdok 2018 Nature V15,RWTH Aachen University;Pennsylvania State University;Canada's Michael Smith Genome Sciences Centre,RWTH Aachen University,RWTH Aachen University;Pennsylvania State University;Canada's Michael Smith Genome Sciences Centre
+OPENALEX,https://openalex.org/W1590183771,10.1017/cbo9780511804779,,Bayesian Reasoning and Machine Learning,Cambridge University Press eBooks,,,2012,book,en,1650,['Barber D.'],['David Barber'],"['UCL Australia', 'University College London']",,[],"['Toolbox', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Data science', 'Human–computer interaction', 'Programming language']","['Toolbox', 'Computer science', 'Artificial intelligence', 'Machine learning', 'Data science', 'Human–computer interaction', 'Programming language']",,,,,,Barber 2012 Cambridge VV0,UCL Australia;University College London,UCL Australia,UCL Australia;University College London
+OPENALEX,https://openalex.org/W2337082154,10.1038/nphys4035,,Machine learning phases of matter,Nature Physics,,,2017,article,en,1469,"['Carrasquilla J.', 'Melko R.']","['Juan Carrasquilla', 'Roger G. Melko']","['Perimeter Institute', 'University of Waterloo', 'Perimeter Institute']",,[],"['Physics', 'Artificial neural network', 'Locality', 'Artificial intelligence', 'Convolutional neural network', 'Monte Carlo method', 'Statistical physics', 'Coulomb', 'Machine learning', 'Computer science', 'Quantum mechanics']","['Physics', 'Artificial neural network', 'Locality', 'Artificial intelligence', 'Convolutional neural network', 'Monte Carlo method', 'Statistical physics', 'Coulomb', 'Machine learning', 'Computer science', 'Quantum mechanics', 'Linguistics', 'Electron', 'Mathematics', 'Statistics', 'Philosophy']",,13,5,431,434,Carrasquilla 2017 Nature V13,Perimeter Institute;University of Waterloo;Perimeter Institute,Perimeter Institute,Perimeter Institute;University of Waterloo;Perimeter Institute
diff --git a/test_pipeline.py b/test_pipeline.py
new file mode 100644
index 000000000..4c9407835
--- /dev/null
+++ b/test_pipeline.py
@@ -0,0 +1,12 @@
+import sys
+sys.path.insert(0, "www")
+
+from services.standardizer import convert2df
+
+print("Testing PubMed...")
+df = convert2df("machine learning", source="pubmed", max_results=10)
+print(df[["AU", "TI", "PY", "DB"]].head())
+
+print("\nTesting OpenAlex...")
+df2 = convert2df("machine learning", source="openalex", max_results=10)
+print(df2[["AU", "TI", "PY", "DB"]].head())
\ No newline at end of file
diff --git a/test_report.txt b/test_report.txt
new file mode 100644
index 000000000..37375530f
--- /dev/null
+++ b/test_report.txt
@@ -0,0 +1,173 @@
+===========================================================================
+🚀 BIBLIOMETRIX: ADVANCED INDIVIDUAL FUNCTION VALIDATION
+===========================================================================
+✅ SUCCESS: Loaded 'standardized_output.csv' with Strict Type Contracts (50 records)
+
+🔍 Executing true analytical sub-functions under strict null contracts...
+
+🧪 Testing Function: [plotlydownload.plotly_download] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [plotlydownload.plotly_download] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [igraph2vis.avoid_net_overlaps] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [igraph2vis.avoid_net_overlaps] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [igraph2vis.igraph2vis] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [igraph2vis.igraph2vis] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [histnetwork.histNetwork] ... 
+Scopus DB:
+Processing citations...
+
+❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [histnetwork.histNetwork] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [histnetwork.scopus] ... 
+Scopus DB:
+Processing citations...
+
+
+Scopus DB:
+Processing citations...
+
+❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [histnetwork.scopus] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [histnetwork.wos] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [histnetwork.wos] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [cocmatrix.cocMatrix] ... Processing field: AU
+
+✅ PASSED
+🧪 Testing Function: [cocmatrix.reduceRefs] ... ✅ PASSED
+🧪 Testing Function: [metatagextraction.AU1_CO] ... ✅ PASSED
+🧪 Testing Function: [metatagextraction.AU_CO] ... ✅ PASSED
+🧪 Testing Function: [metatagextraction.AU_UN] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [metatagextraction.AU_UN] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [metatagextraction.CR_AU] ... ✅ PASSED
+🧪 Testing Function: [metatagextraction.CR_SO] ... ✅ PASSED
+🧪 Testing Function: [metatagextraction.SR] ... ✅ PASSED
+🧪 Testing Function: [metatagextraction.metaTagExtraction] ... ✅ PASSED
+🧪 Testing Function: [histplot.delete_isolates2] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [histplot.delete_isolates2] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [histplot.histPlot] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [histplot.histPlot] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [savereport.add_to_report] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [savereport.add_to_report] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [savereport.save_report] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [savereport.save_report] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [thematicmap.cluster_assignment] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [thematicmap.cluster_assignment] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [thematicmap.thematic_map] ... Processing field: ID
+
+❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [thematicmap.thematic_map] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [networkplot.clustering_network] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [networkplot.clustering_network] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [networkplot.delete_isolates] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [networkplot.delete_isolates] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [networkplot.network_plot] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [networkplot.network_plot] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [networkplot.normalize_similarity] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [networkplot.normalize_similarity] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [networkplot.rgba_to_hex] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [networkplot.rgba_to_hex] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [networkplot.weight_community] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [networkplot.weight_community] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [couplingmap.avoid_net_overlaps] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [couplingmap.avoid_net_overlaps] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [couplingmap.best_lab] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [couplingmap.best_lab] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [couplingmap.couplingMap] ... Processing field: CR
+
+Matrix is empty!!
+❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [couplingmap.couplingMap] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [couplingmap.labeling] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [couplingmap.labeling] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [couplingmap.localCitations] ... 
+Scopus DB:
+Processing citations...
+
+❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [couplingmap.localCitations] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [couplingmap.network] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [couplingmap.network] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [couplingmap.normalizeCitationScore] ... 
+Scopus DB:
+Processing citations...
+
+❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [couplingmap.normalizeCitationScore] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [termextraction.term_extraction] ... Term combination into lists per document done in 0.0002 seconds
+✅ PASSED
+🧪 Testing Function: [biblionetwork.biblionetwork] ... Processing field: AU
+
+Processing field: CR
+
+Matrix is empty!!
+❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [biblionetwork.biblionetwork] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [biblionetwork.label_short] ... ✅ PASSED
+🧪 Testing Function: [biblionetwork.remove_duplicated_labels] ... ✅ PASSED
+🧪 Testing Function: [tabletag.table_tag] ... ❌ CRASHED
+
+--- TRACEBACK LOG FOR FUNCTION: [tabletag.table_tag] ---
+---------------------------------------------------------------------------
+🧪 Testing Function: [htmldownload.html_download] ... ✅ PASSED
+
+===========================================================================
+📊 TARGET SCHEMA FUNCTION COMPATIBILITY SUMMARY
+===========================================================================
+   - Core Analytical Functions Tested: 40
+   - Successfully Passed             : 12
+   - Failed / Incompatible           : 28
+   - Internal Pipeline Helpers Omitted: 4
+===========================================================================
diff --git a/www/.DS_Store b/www/.DS_Store
new file mode 100644
index 000000000..8385c95a7
Binary files /dev/null and b/www/.DS_Store differ
diff --git a/www/__init__.py b/www/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/www/services.zip b/www/services.zip
new file mode 100644
index 000000000..5afd45cf0
Binary files /dev/null and b/www/services.zip differ
diff --git a/www/services/ standardizer.py b/www/services/ standardizer.py
new file mode 100644
index 000000000..7358b4ac7
--- /dev/null
+++ b/www/services/ standardizer.py	
@@ -0,0 +1,29 @@
+import pandas as pd
+from etl.extractors import fetch_pubmed, fetch_openalex
+from etl.transformers import transform
+from etl.validators import validate, print_report
+
+
+def convert2df(query: str, source: str = "pubmed", max_results: int = 100,
+               verbose: bool = True) -> pd.DataFrame:
+
+    source = source.lower().strip()
+
+    if source == "pubmed":
+        df = fetch_pubmed(query, max_results)
+    elif source == "openalex":
+        df = fetch_openalex(query, max_results)
+    else:
+        raise ValueError(f"Unknown source: '{source}'. Choose 'pubmed' or 'openalex'.")
+
+    if df.empty:
+        print("No results found.")
+        return df
+
+    df = transform(df)
+
+    result = validate(df)
+    if verbose:
+        print_report(result)
+
+    return df
\ No newline at end of file
diff --git a/www/services/.DS_Store b/www/services/.DS_Store
new file mode 100644
index 000000000..622d58071
Binary files /dev/null and b/www/services/.DS_Store differ
diff --git a/www/services/__init__.py b/www/services/__init__.py
index 28584e105..a611eed83 100644
--- a/www/services/__init__.py
+++ b/www/services/__init__.py
@@ -1,4 +1,5 @@
-from .biblionetwork import *
+import www.services.biblionetwork as biblionetwork_module
+from .biblionetwork import biblionetwork, label_short, remove_duplicated_labels
 from .cocmatrix import *
 from .couplingmap import *
 from .format_functions import *
@@ -14,4 +15,4 @@
 from .tabletag import *
 from .termextraction import *
 from .thematicmap import *
-from .utils import *
\ No newline at end of file
+from .utils import *
diff --git a/www/services/biblionetwork.py b/www/services/biblionetwork.py
index 7e65b4880..0fba150a1 100644
--- a/www/services/biblionetwork.py
+++ b/www/services/biblionetwork.py
@@ -1,10 +1,14 @@
 from .utils import *
 from .cocmatrix import *
 
+__all__ = ["biblionetwork", "label_short", "remove_duplicated_labels"]
+
 
 def biblionetwork(M, analysis="coupling", network="authors", n=None, sep=";", short=False, shortlabel=True, remove_terms=None, synonyms=None):
     
     def crossprod(A, B):
+        if A is None or B is None:
+            return None
         return A.T @ B  # Moltiplicazione matriciale per ottenere il prodotto incrociato
 
     NetMatrix = None
@@ -71,7 +75,7 @@ def crossprod(A, B):
         filtered_index = [idx for idx in NetMatrix.index if str(idx).strip()]
         NetMatrix = NetMatrix.loc[filtered_index, filtered_columns]
 
-        M = M.get()  # Estrai il dizionario se M è un oggetto
+        M = M  # Estrai il dizionario se M è un oggetto
 
         db_name = M["DB"].iloc[0]
         print(f"db_name: {db_name}")
diff --git a/www/services/cocmatrix.py b/www/services/cocmatrix.py
index f523aed67..9eda87ee2 100644
--- a/www/services/cocmatrix.py
+++ b/www/services/cocmatrix.py
@@ -19,7 +19,7 @@ def cocMatrix(df, Field="AU", type="sparse", n=None, sep=";", binary=True, short
     Returns:
         A bipartite network matrix with cases corresponding to manuscripts and variables to the objects extracted from the Tag Field.
     """
-    M = df.get()
+    M = df
 
     if "LABEL" not in M.columns:
         M.index = M["SR"]
@@ -29,7 +29,8 @@ def cocMatrix(df, Field="AU", type="sparse", n=None, sep=";", binary=True, short
     # REMOVE TERMS AND MERGE SYNONYMS
     if Field in ["ID", "DE", "TI", "TI_TM", "AB", "AB_TM"]:
         Fi = M[Field].fillna("").apply(lambda x: x if isinstance(x, list) else [i.strip() for i in x.split(sep)])
-        TERMS = pd.DataFrame({"item": [item.upper() for sublist in Fi for item in sublist], "SR": M.index.repeat(Fi.str.len())})
+        Fi_lens = Fi.apply(len)
+        TERMS = pd.DataFrame({"item": [item.upper() for sublist in Fi for item in sublist], "SR": M.index.repeat(Fi_lens)})
 
         # Merge synonyms
         if synonyms:
diff --git a/www/services/couplingmap.py b/www/services/couplingmap.py
index a2b3628d7..305565cda 100644
--- a/www/services/couplingmap.py
+++ b/www/services/couplingmap.py
@@ -15,13 +15,18 @@ def couplingMap(df, analysis="documents", field="CR", n=500, minfreq=5,
         print('\nanalysis argument is incorrect.\n\nPlease select one of the following choices: "documents", "authors", "sources"\n\n')
         return None
 
-    df = metaTagExtraction(df, "SR") # serve questo per avere il merging perfetto per uniformare la colonna SR
-    M = df.get()
+    if "SR" not in df.columns or (df["SR"] == "").all():
+        df = metaTagExtraction(df, "SR")
+    df["TC"] = pd.to_numeric(df["TC"], errors="coerce").fillna(0).astype(int)
+    df["PY"] = pd.to_numeric(df["PY"], errors="coerce").fillna(0).astype(int)
+    M = df
 
     ngrams = int(ngrams)
     minfreq = max(0, int(minfreq * len(M) // 1000))
 
     Net = network(df, analysis=analysis, field=field, stemming=stemming, n=n, community_repulsion=community_repulsion, cluster=clustering)
+    if Net is None:
+        raise ValueError("Network is empty. Not enough data for coupling analysis.")
     net = Net['graph']
   
     NCS = normalizeCitationScore(df, field=analysis, impact_measure=impact_measure)
@@ -436,7 +441,7 @@ def labeling(df, df_lab, term, n, n_labels, analysis, ngrams):
     # Se il termine è TI o AB, estrai termini
     if term in ["TI", "AB"]:
         df = term_extraction(reactive.Value(df), field=term, ngrams=ngrams, verbose=False)
-        df = df.get()
+        df = df
         term = f"{term}_TM"
 
     # Normalizzazione delle stringhe per evitare errori di merge
@@ -517,7 +522,7 @@ def best_lab(df, tab_global, n_labels, term):
 
 def localCitations(df, fast_search=False, sep=";"):
     df = metaTagExtraction(df, "SR")
-    M = df.get() 
+    M = df 
     M['TC'] = M['TC'].fillna(0)
     if fast_search:
         loccit = M['TC'].quantile(0.75)
diff --git a/www/services/etl/__init__.py b/www/services/etl/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/www/services/etl/extractors.py b/www/services/etl/extractors.py
new file mode 100644
index 000000000..122f55b4d
--- /dev/null
+++ b/www/services/etl/extractors.py
@@ -0,0 +1,154 @@
+import requests
+import pandas as pd
+from Bio import Entrez
+
+Entrez.email = "your@email.com"
+
+
+def fetch_pubmed(query: str, max_results: int = 100) -> pd.DataFrame:
+    search = Entrez.esearch(db="pubmed", term=query, retmax=max_results)
+    ids = Entrez.read(search)["IdList"]
+    if not ids:
+        return pd.DataFrame()
+
+    fetch = Entrez.efetch(db="pubmed", id=",".join(ids), rettype="xml", retmode="xml")
+    records = Entrez.read(fetch)
+
+    rows = []
+    for article in records["PubmedArticle"]:
+        med = article["MedlineCitation"]
+        art = med["Article"]
+
+        authors = []
+        author_full = []
+        for a in art.get("AuthorList", []):
+            last = a.get("LastName", "")
+            fore = a.get("ForeName", "")
+            if last:
+                authors.append(f"{last} {fore[0]}." if fore else last)
+                author_full.append(f"{last}, {fore}" if fore else last)
+
+        journal = art.get("Journal", {})
+        issue = journal.get("JournalIssue", {})
+        pubdate = issue.get("PubDate", {})
+        year = str(pubdate.get("Year", pubdate.get("MedlineDate", "")[:4] if pubdate.get("MedlineDate") else ""))
+
+        pmid = str(med.get("PMID", ""))
+
+        doi = ""
+        for loc in art.get("ELocationID", []):
+            if str(loc.attributes.get("EIdType", "")) == "doi":
+                doi = str(loc)
+                break
+
+        rows.append({
+            "DB":   "PUBMED",
+            "UT":   f"PMID:{pmid}",
+            "DI":   doi,
+            "PMID": pmid,
+            "TI":   str(art.get("ArticleTitle", "")),
+            "SO":   str(journal.get("Title", "")),
+            "JI":   str(journal.get("ISOAbbreviation", "")),
+            "J9":   str(journal.get("ISOAbbreviation", "")),
+            "PY":   year,
+            "DT":   str(art.get("PublicationTypeList", [""])[0]),
+            "LA":   str(art.get("Language", [""])[0]) if art.get("Language") else "",
+            "TC":   0,
+            "AU":   authors,
+            "AF":   author_full,
+            "C1":   [],
+            "RP":   "",
+                "CR":   [r.split("/")[-1] for r in w.get("referenced_works", [])],
+            "DE":   [],
+            "ID":   [],
+            "AB":   str(art.get("Abstract", {}).get("AbstractText", [""])[0]),
+            "VL":   str(issue.get("Volume", "")),
+            "IS":   str(issue.get("Issue", "")),
+            "BP":   "",
+            "EP":   "",
+        })
+
+    return pd.DataFrame(rows)
+
+
+def fetch_openalex(query: str, max_results: int = 100) -> pd.DataFrame:
+    url = "https://api.openalex.org/works"
+    rows = []
+    page = 1
+    per_page = min(200, max_results)
+
+    while len(rows) < max_results:
+        params = {
+            "search": query,
+            "per-page": per_page,
+            "page": page,
+            "mailto": "your@email.com"
+        }
+        resp = requests.get(url, params=params, timeout=30)
+        resp.raise_for_status()
+        data = resp.json()
+        works = data.get("results", [])
+        if not works:
+            break
+
+        for w in works:
+            if len(rows) >= max_results:
+                break
+
+            authors = []
+            author_full = []
+            affiliations = []
+            for a in w.get("authorships", []):
+                name = a.get("author", {}).get("display_name", "")
+                if name:
+                    parts = name.split()
+                    if len(parts) >= 2:
+                        authors.append(f"{parts[-1]} {parts[0][0]}.")
+                    else:
+                        authors.append(name)
+                    author_full.append(name)
+                for inst in a.get("institutions", []):
+                    inst_name = inst.get("display_name", "")
+                    if inst_name:
+                        affiliations.append(inst_name)
+
+            venue = w.get("primary_location") or {}
+            source = venue.get("source") or {}
+            biblio = w.get("biblio") or {}
+
+            doi = str(w.get("doi", "") or "").replace("https://doi.org/", "")
+            pmid = ""
+            for pid in w.get("ids", {}).values():
+                if str(pid).startswith("https://pubmed.ncbi.nlm.nih.gov/"):
+                    pmid = str(pid).split("/")[-1]
+
+            rows.append({
+                "DB":   "OPENALEX",
+                "UT":   str(w.get("id", "")),
+                "DI":   doi,
+                "PMID": pmid,
+                "TI":   str(w.get("title", "") or ""),
+                "SO":   str(source.get("display_name", "") or ""),
+                "JI":   str(source.get("abbreviated_title", "") or ""),
+                "J9":   str(source.get("abbreviated_title", "") or ""),
+                "PY":   str(w.get("publication_year", "") or ""),
+                "DT":   str(w.get("type", "") or ""),
+                "LA":   str(w.get("language", "") or ""),
+                "TC":   int(w.get("cited_by_count", 0) or 0),
+                "AU":   authors,
+                "AF":   author_full,
+                "C1":   affiliations,
+                "RP":   "",
+                "CR":   [r.split("/")[-1] for r in w.get("referenced_works", [])],
+                "DE":   [k["display_name"] for k in w.get("keywords", [])],
+                "ID":   [c["display_name"] for c in w.get("concepts", [])],
+                "AB":   str(w.get("abstract", "") or ""),
+                "VL":   str(biblio.get("volume", "") or ""),
+                "IS":   str(biblio.get("issue", "") or ""),
+                "BP":   str(biblio.get("first_page", "") or ""),
+                "EP":   str(biblio.get("last_page", "") or ""),
+            })
+
+        page += 1
+
+    return pd.DataFrame(rows)
\ No newline at end of file
diff --git a/www/services/etl/loader.py b/www/services/etl/loader.py
new file mode 100644
index 000000000..6c5685ce0
--- /dev/null
+++ b/www/services/etl/loader.py
@@ -0,0 +1,31 @@
+import pandas as pd
+import ast
+from .schemas import MULTI_VALUE_FIELDS, INT_FIELDS
+
+def load_standardized_csv(path: str) -> pd.DataFrame:
+    df = pd.read_csv(path)
+    for col in MULTI_VALUE_FIELDS:
+        if col in df.columns:
+            df[col] = df[col].apply(_parse_list)
+        else:
+            df[col] = [[] for _ in range(len(df))]
+    for col in INT_FIELDS:
+        if col in df.columns:
+            df[col] = pd.to_numeric(df[col], errors="coerce").fillna(0).astype(int)
+    df = df.fillna("")
+    return df
+
+def _parse_list(val):
+    if isinstance(val, list):
+        return val
+    if pd.isna(val) or val == "" or val is None:
+        return []
+    if isinstance(val, str):
+        val = val.strip()
+        if val.startswith("["):
+            try:
+                return ast.literal_eval(val)
+            except:
+                pass
+        return [x.strip() for x in val.split(";") if x.strip()]
+    return [str(val)]
diff --git a/www/services/etl/schemas.py b/www/services/etl/schemas.py
new file mode 100644
index 000000000..12b29e603
--- /dev/null
+++ b/www/services/etl/schemas.py
@@ -0,0 +1,57 @@
+REQUIRED_FIELDS = [
+    "DB", "UT", "DI", "PMID", "TI", "SO", "JI", "J9", "PY", "DT", "LA",
+    "TC", "AU", "AF", "C1", "RP", "CR", "DE", "ID", "AB", "VL", "IS",
+    "BP", "EP", "SR"
+]
+
+MULTI_VALUE_FIELDS = ["AU", "AF", "C1", "CR", "DE", "ID"]
+
+STRING_FIELDS = [
+    "DB", "UT", "DI", "PMID", "TI", "SO", "JI", "J9", "DT", "LA",
+    "RP", "AB", "VL", "IS", "BP", "EP", "SR"
+]
+
+INT_FIELDS = ["TC"]
+
+YEAR_FIELDS = ["PY"]
+
+FIELD_DESCRIPTIONS = {
+    "DB":   "Database Source",
+    "UT":   "Unique Article Identifier",
+    "DI":   "DOI",
+    "PMID": "PubMed ID",
+    "TI":   "Title",
+    "SO":   "Publication Name",
+    "JI":   "ISO Source Abbreviation",
+    "J9":   "Journal Abbreviation",
+    "PY":   "Publication Year",
+    "DT":   "Document Type",
+    "LA":   "Language",
+    "TC":   "Times Cited",
+    "AU":   "Authors",
+    "AF":   "Author Full Names",
+    "C1":   "Author Affiliations",
+    "RP":   "Reprint Address",
+    "CR":   "Cited References",
+    "DE":   "Author Keywords",
+    "ID":   "Index Keywords",
+    "AB":   "Abstract",
+    "VL":   "Volume",
+    "IS":   "Issue",
+    "BP":   "Beginning Page",
+    "EP":   "Ending Page",
+    "SR":   "Short Reference",
+}
+
+
+def empty_record() -> dict:
+    record = {}
+    for field in MULTI_VALUE_FIELDS:
+        record[field] = []
+    for field in STRING_FIELDS:
+        record[field] = ""
+    for field in INT_FIELDS:
+        record[field] = 0
+    for field in YEAR_FIELDS:
+        record[field] = ""
+    return record
\ No newline at end of file
diff --git a/www/services/etl/transformers.py b/www/services/etl/transformers.py
new file mode 100644
index 000000000..e4bf7bb72
--- /dev/null
+++ b/www/services/etl/transformers.py
@@ -0,0 +1,87 @@
+import pandas as pd
+from .schemas import MULTI_VALUE_FIELDS, STRING_FIELDS, INT_FIELDS, YEAR_FIELDS, REQUIRED_FIELDS
+
+
+def enforce_types(df: pd.DataFrame) -> pd.DataFrame:
+    for col in MULTI_VALUE_FIELDS:
+        if col in df.columns:
+            df[col] = df[col].apply(
+                lambda x: x if isinstance(x, list) else ([] if pd.isna(x) else [str(x)])
+            )
+        else:
+            df[col] = [[] for _ in range(len(df))]
+
+    for col in STRING_FIELDS:
+        if col in df.columns:
+            df[col] = df[col].fillna("").astype(str)
+        else:
+            df[col] = ""
+
+    for col in INT_FIELDS:
+        if col in df.columns:
+            df[col] = pd.to_numeric(df[col], errors="coerce").fillna(0).astype(int)
+        else:
+            df[col] = 0
+
+    for col in YEAR_FIELDS:
+        if col in df.columns:
+            df[col] = pd.to_numeric(df[col], errors="coerce").fillna(0).astype(int)
+        else:
+            df[col] = 0
+
+    return df
+
+
+def ensure_columns(df: pd.DataFrame) -> pd.DataFrame:
+    for col in REQUIRED_FIELDS:
+        if col not in df.columns:
+            if col in MULTI_VALUE_FIELDS:
+                df[col] = [[] for _ in range(len(df))]
+            elif col in INT_FIELDS:
+                df[col] = 0
+            else:
+                df[col] = ""
+
+    extra = [c for c in df.columns if c not in REQUIRED_FIELDS]
+    return df[REQUIRED_FIELDS + extra]
+
+
+def add_sr_field(df: pd.DataFrame) -> pd.DataFrame:
+    def make_sr(row):
+        authors = row.get("AU", [])
+        first_author = authors[0].split()[0] if authors else "UNKNOWN"
+        year = str(row.get("PY", "")) or "0000"
+        journal = str(row.get("J9", "")) or str(row.get("SO", ""))
+        journal_abbr = journal.split()[0] if journal else "UNKNOWNJ"
+        volume = str(row.get("VL", "")) or "V0"
+        return f"{first_author} {year} {journal_abbr} V{volume}"
+
+    df["SR"] = df.apply(make_sr, axis=1)
+    return df
+
+
+def add_extra_fields(df: pd.DataFrame) -> pd.DataFrame:
+    if "C1" in df.columns:
+        df["AU_UN"] = df["C1"].apply(
+            lambda x: ";".join(x) if isinstance(x, list) else (x if isinstance(x, str) else "")
+        )
+    else:
+        df["AU_UN"] = ""
+
+    def extract_country(affiliations):
+        if isinstance(affiliations, list) and affiliations:
+            return affiliations[0].split(",")[-1].strip()
+        return ""
+
+    df["AU1_CO"] = df["C1"].apply(extract_country)
+    df["C3"] = df["AU_UN"]
+
+    return df
+
+
+def transform(df: pd.DataFrame) -> pd.DataFrame:
+    df = ensure_columns(df)
+    df = enforce_types(df)
+    df = add_sr_field(df)
+    df = add_extra_fields(df)
+    return df
\ No newline at end of file
diff --git a/www/services/etl/validators.py b/www/services/etl/validators.py
new file mode 100644
index 000000000..70f4690f2
--- /dev/null
+++ b/www/services/etl/validators.py
@@ -0,0 +1,87 @@
+import pandas as pd
+from .schemas import REQUIRED_FIELDS, MULTI_VALUE_FIELDS, STRING_FIELDS, INT_FIELDS, YEAR_FIELDS
+
+
+def validate(df: pd.DataFrame) -> dict:
+    errors = []
+    warnings = []
+
+    for col in REQUIRED_FIELDS:
+        if col not in df.columns:
+            errors.append(f"Missing required column: {col}")
+
+    for col in MULTI_VALUE_FIELDS:
+        if col in df.columns:
+            bad = df[col].apply(lambda x: not isinstance(x, list)).sum()
+            if bad:
+                errors.append(f"{col}: {bad} rows are not list type")
+
+    for col in STRING_FIELDS:
+        if col in df.columns:
+            bad = df[col].apply(lambda x: not isinstance(x, str)).sum()
+            if bad:
+                errors.append(f"{col}: {bad} rows are not string type")
+
+    for col in INT_FIELDS:
+        if col in df.columns:
+            bad = df[col].apply(lambda x: not isinstance(x, int)).sum()
+            if bad:
+                errors.append(f"{col}: {bad} rows are not int type")
+
+    for col in REQUIRED_FIELDS:
+        if col not in df.columns:
+            continue
+        if col in MULTI_VALUE_FIELDS:
+            nulls = df[col].apply(lambda x: x is None).sum()
+        else:
+            nulls = df[col].isna().sum()
+        if nulls:
+            errors.append(f"{col}: {nulls} rows contain None/NaN")
+
+    for col in ["AU", "TI", "PY"]:
+        if col in df.columns:
+            if col in MULTI_VALUE_FIELDS:
+                empty = df[col].apply(lambda x: isinstance(x, list) and len(x) == 0).sum()
+            else:
+                empty = (df[col] == "").sum()
+            if empty:
+                warnings.append(f"{col}: {empty} rows are empty")
+
+    if "PY" in df.columns:
+        bad_years = df["PY"].apply(
+            lambda x: x != "" and (not str(x).isdigit() or not (1000 <= int(str(x)) <= 2100))
+        ).sum()
+        if bad_years:
+            warnings.append(f"PY: {bad_years} rows have invalid year format")
+
+    if "TC" in df.columns:
+        neg = (df["TC"] < 0).sum()
+        if neg:
+            warnings.append(f"TC: {neg} rows have negative citation count")
+
+    return {
+        "valid": len(errors) == 0,
+        "errors": errors,
+        "warnings": warnings,
+        "total_records": len(df),
+    }
+
+
+def print_report(result: dict):
+    print(f"\n{'='*40}")
+    print(f"Validation Report")
+    print(f"{'='*40}")
+    print(f"Total records : {result['total_records']}")
+    print(f"Status        : {'VALID' if result['valid'] else 'INVALID'}")
+
+    if result["errors"]:
+        print(f"\nErrors ({len(result['errors'])}):")
+        for e in result["errors"]:
+            print(f"  x {e}")
+
+    if result["warnings"]:
+        print(f"\nWarnings ({len(result['warnings'])}):")
+        for w in result["warnings"]:
+            print(f"  ! {w}")
+
+    print(f"{'='*40}\n")
\ No newline at end of file
diff --git a/www/services/format_functions.py b/www/services/format_functions.py
index 1a8ee7af4..3d8e3cf3c 100644
--- a/www/services/format_functions.py
+++ b/www/services/format_functions.py
@@ -19,17 +19,20 @@ def format_ab_column(entry, source, file_type):         # Function for AB Column
         if file_type == '.bib':
             abstract = entry.get('abstract', '')
         elif file_type == '.csv':
-            abstract = entry['Abstract']
+            abstract = entry.get('Abstract', '')
     elif source == 'Dimensions':
         if file_type == '.csv' or file_type == '.xlsx':
-            abstract = entry['Abstract']
+            abstract = entry.get('Abstract', '')
     elif source == 'The_Lens':
         if file_type == '.csv':
-            abstract = entry['Abstract']
+            abstract = entry.get('Abstract', '')
     elif source == 'Cochrane':
         if file_type == '.txt':
             abstract = entry.get('AB', '')
 
+
+    elif source == 'OpenAlex':
+        return entry.get('AB', '')
     return abstract
 
 
@@ -124,6 +127,9 @@ def format_af_column(entry, source, file_type):         # Function for AF Column
     elif source == 'Cochrane':
         if file_type == '.txt':
             authors = ''
+
+    elif source == 'OpenAlex':
+        return entry.get('AF', '')
     return authors
 
 
@@ -233,6 +239,9 @@ def format_au_column(entry, source, file_type):         # Function for AU Column
                         author_dict = surname + ' ' + initials[0]
                     authors.append(author_dict)
 
+
+    elif source == 'OpenAlex':
+        return entry.get('AU', '')
     return authors
 
 
@@ -279,6 +288,9 @@ def format_au1_un_column(entry, source, file_type):     # Function for AU1_UN Co
         if file_type == '.txt':
             university = ''
         
+
+    elif source == 'OpenAlex':
+        return entry.get('AU1_UN', '')
     return university
 
 
@@ -333,6 +345,9 @@ def format_au_un_column(entry, source, file_type):      # Function for AU_UN Col
             university = ''
             universities.append(university)
 
+
+    elif source == 'OpenAlex':
+        return entry.get('AU_UN', '')
     return universities
 
 
@@ -368,6 +383,9 @@ def format_bp_column(entry, source, file_type):         # Function for BP Column
         if file_type == '.txt':
             begin_page = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('BP', '')
     return begin_page
 
 
@@ -424,6 +442,9 @@ def format_c1_column(entry, source, file_type):         # Function for C1 Column
         if file_type == '.txt':
             affiliations = []
 
+
+    elif source == 'OpenAlex':
+        return entry.get('C1', '')
     return affiliations
 
 
@@ -455,6 +476,9 @@ def format_cr_column(entry, source, file_type):         # Function for CR Column
         if file_type == '.txt':
             cited_references = []
 
+
+    elif source == 'OpenAlex':
+        return entry.get('CR', '')
     return cited_references
 
 
@@ -511,6 +535,9 @@ def format_de_column(entry, source, file_type):         # Function for DE Column
             for keyword in entry.get('KY', '').split(";"):
                 author_keywords.append(keyword)
 
+
+    elif source == 'OpenAlex':
+        return entry.get('DE', '')
     return author_keywords
 
 
@@ -539,6 +566,9 @@ def format_di_column(entry, source, file_type):         # Function for DI Column
         if file_type == '.txt':
             doi = entry.get('DOI', '')
 
+
+    elif source == 'OpenAlex':
+        return entry.get('DI', '')
     return doi
 
 
@@ -567,6 +597,9 @@ def format_dt_column(entry, source, file_type):         # Function for DT Column
         if file_type == '.txt':
             document_type = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('DT', '')
     return document_type
 
 
@@ -606,6 +639,9 @@ def format_em_column(entry, source, file_type):         # Function for EM Column
         if file_type == '.txt':
             emails = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('EM', '')
     return emails
 
 
@@ -649,6 +685,9 @@ def format_ep_column(entry, source, file_type):         # Function for EP Column
         if file_type == '.txt':
             end_page = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('EP', '')
     return end_page
 
 
@@ -679,6 +718,9 @@ def format_fu_column(entry, source, file_type):         # Function for FU Column
         if file_type == '.txt':
             funding = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('FU', '')
     return funding
 
 
@@ -706,6 +748,9 @@ def format_fx_column(entry, source, file_type):         # Function for FX Column
         if file_type == '.txt':
             fx = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('FX', '')
     return fx
 
 
@@ -756,6 +801,9 @@ def format_id_column(entry, source, file_type):         # Function for ID Column
             for keyword in entry.get('KY', '').split(";"):
                 index_keywords.append(keyword)
 
+
+    elif source == 'OpenAlex':
+        return entry.get('ID', '')
     return index_keywords
 
 
@@ -785,6 +833,9 @@ def format_is_column(entry, source, file_type):         # Function for IS Column
         if file_type == '.txt':
             issue = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('IS', '')
     return issue
 
 
@@ -813,6 +864,9 @@ def format_ji_column(entry, source, file_type):         # Function for JI Column
         if file_type == '.txt':
             abbrev_source_title = entry.get('SO', '')
     
+
+    elif source == 'OpenAlex':
+        return entry.get('JI', '')
     return abbrev_source_title
 
 
@@ -841,6 +895,9 @@ def format_la_column(entry, source, file_type):         # Function for LA Column
         if file_type == '.txt':
             language = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('LA', '')
     return language
 
 
@@ -874,6 +931,9 @@ def format_oa_column(entry, source, file_type):         # Function for OA Column
         if file_type == '.txt':
             open_access = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('OA', '')
     return open_access
 
 
@@ -917,6 +977,9 @@ def format_oi_column(entry, source, file_type):         # Function for OI Column
         if file_type == '.txt':
             oi = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('OI', '')
     return oi
 
 
@@ -951,6 +1014,9 @@ def format_pmid_column(entry, source, file_type):       # Function for PMID Colu
         if file_type == '.txt':
             pmid = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('PMID', '')
     return pmid
 
 
@@ -979,6 +1045,9 @@ def format_pu_column(entry, source, file_type):         # Function for PU Column
         if file_type == '.txt':
             publisher = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('PU', '')
     return publisher
 
 
@@ -1008,6 +1077,9 @@ def format_py_column(entry, source, file_type):         # Function for PY Column
         if file_type == '.txt':
             publication_year = entry.get('YR', '')
 
+
+    elif source == 'OpenAlex':
+        return entry.get('PY', '')
     return publication_year
 
 
@@ -1060,6 +1132,9 @@ def format_rp_column(entry, source, file_type):         # Function for RP Column
         if file_type == '.txt':
             correspondence_address = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('RP', '')
     return correspondence_address
 
 
@@ -1093,6 +1168,9 @@ def format_sc_column(entry, source, file_type):         # Function for SC Column
         if file_type == '.txt':
             fields = ''
 
+
+    elif source == 'OpenAlex':
+        return entry.get('SC', '')
     return fields
 
 
@@ -1121,6 +1199,9 @@ def format_sn_column(entry, source, file_type):         # Function for SN Column
         if file_type == '.txt':
             issn = entry.get('SN', '')
 
+
+    elif source == 'OpenAlex':
+        return entry.get('SN', '')
     return issn
 
 
@@ -1155,6 +1236,9 @@ def format_so_column(entry, source, file_type):         # Function for SO Column
         if file_type == '.txt':
             journal = entry.get('SO', '')
             
+
+    elif source == 'OpenAlex':
+        return entry.get('SO', '')
     return journal
 
 
@@ -1253,6 +1337,9 @@ def format_sr_column(entry, source, file_type):  # Function for SR Column (forma
             ta = entry.get('SO', '')
             sr = author + ', ' + publication_year + ', ' + ta
 
+
+    elif source == 'OpenAlex':
+        return entry.get('SR', '')
     return sr
 
 
@@ -1287,6 +1374,9 @@ def format_tc_column(entry, source, file_type):  # Function for TC Column (forma
         if file_type == '.txt':
             times_cited = 0
 
+
+    elif source == 'OpenAlex':
+        return entry.get('TC', '')
     return times_cited
 
 
@@ -1319,6 +1409,9 @@ def format_ti_column(entry, source, file_type):  # Function for TI Column (forma
         if file_type == '.txt':
             title = entry.get('TI', '')
 
+
+    elif source == 'OpenAlex':
+        return entry.get('TI', '')
     return title
 
 
@@ -1354,6 +1447,9 @@ def format_ut_column(entry, source, file_type):  # Function for UT Column (forma
         if file_type == '.txt':
             publication_id = entry.get('ID', '')
 
+
+    elif source == 'OpenAlex':
+        return entry.get('UT', '')
     return publication_id
 
 
@@ -1382,6 +1478,9 @@ def format_vl_column(entry, source, file_type):  # Function for VL Column (forma
         if file_type == '.txt':
             volume = ''
             
+
+    elif source == 'OpenAlex':
+        return entry.get('VL', '')
     return volume
 
 
@@ -1576,6 +1675,12 @@ def process_single_file(data, source, file_type, author):
             file_type = ".txt"
             list_bib_data = parse_pubmed_data(data)
     
+    elif source == "openalex":
+        source = "OpenAlex"
+        if file_type.endswith("csv"):
+            file_type = ".csv"
+            bib_data = pd.read_csv(data)
+            list_bib_data = bib_data.to_dict(orient='records')
     elif source == "cochrane":
         source = "Cochrane"
         if file_type.endswith("txt"):
diff --git a/www/services/histnetwork.py b/www/services/histnetwork.py
index 7848d9744..c22200453 100644
--- a/www/services/histnetwork.py
+++ b/www/services/histnetwork.py
@@ -19,7 +19,7 @@ def histNetwork(df, min_citations=0, sep=";", network=True):
             - M: A DataFrame containing the metadata of the papers with the Local Citation Score (LCS).
             - LCS: A list containing the Local Citation Score of each paper.
     """
-    M = df.get()
+    M = df
     db = M['DB'][0]
 
     # Ensure required fields are present
@@ -38,6 +38,9 @@ def histNetwork(df, min_citations=0, sep=";", network=True):
         results = wos(M, min_citations=min_citations, sep=sep, network=network)
     elif db == "Scopus":
         results = scopus(M, min_citations=min_citations, sep=sep, network=network)
+    elif db in ("OPENALEX", "PUBMED", "Dimensions", "Lens"):
+        # Use scopus-style parser for open-access databases (same SR-based structure)
+        results = scopus(M, min_citations=min_citations, sep=sep, network=network)
     else:
         print("\nDatabase not compatible with direct citation analysis\n")
         return None
diff --git a/www/services/histnetwork.py.bak b/www/services/histnetwork.py.bak
new file mode 100644
index 000000000..cbaac3f9c
--- /dev/null
+++ b/www/services/histnetwork.py.bak
@@ -0,0 +1,226 @@
+from .utils import *
+from .cocmatrix import *
+
+
+def histNetwork(df, min_citations=0, sep=";", network=True):
+    """
+    Create a historical network of citations from a DataFrame containing metadata of scientific papers.
+    
+    Args:
+        df (DataFrame): A DataFrame containing metadata of scientific papers.
+        min_citations (int): Minimum number of citations to include a paper in the analysis.
+        sep (str): Separator used to separate references in the citation network.
+        network (bool): If True, a citation network is created.
+    
+    Returns:
+        A dictionary containing the following keys:
+            - NetMatrix: A DataFrame containing the citation network.
+            - histData: A DataFrame containing the metadata of the papers.
+            - M: A DataFrame containing the metadata of the papers with the Local Citation Score (LCS).
+            - LCS: A list containing the Local Citation Score of each paper.
+    """
+    M = df
+    db = M['DB'][0]
+
+    # Ensure required fields are present
+    if 'DI' not in M:
+        M['DI'] = ""
+    M['DI'] = M['DI'].fillna("")
+
+    if 'CR' not in M:
+        print("\nYour collection does not contain Cited References metadata (Field CR is missing)\n")
+        return None
+
+    # Fill missing values in TC
+    M['TC'] = M['TC'].fillna(0)
+
+    if db == "Web_of_Science":
+        results = wos(M, min_citations=min_citations, sep=sep, network=network)
+    elif db == "Scopus":
+        results = scopus(M, min_citations=min_citations, sep=sep, network=network)
+    else:
+        print("\nDatabase not compatible with direct citation analysis\n")
+        return None
+
+    return results
+
+
+def wos(M, min_citations, sep, network):
+
+    print("\nWOS DB:\nSearching local citations (LCS) by reference items (SR) and DOIs...\n")
+
+    # Sort data by publication year
+    M = M.sort_values(by="PY").reset_index(drop=True)
+
+    # Add unique labels to papers
+    M['Paper'] = np.arange(0, len(M))
+    M['nLABEL'] = np.arange(0, len(M))
+
+    # Process cited references (CR)
+    CR = []
+    for i, refs in enumerate(M['CR']):
+        for ref in refs:
+            # Extract DOI
+            doi = ""
+            if 'DOI' in ref:
+                parts = ref.split('DOI', 1)
+                doi = parts[1].strip() if len(parts) > 1 else ""
+            # Extract AU, PY, SO
+            ref_parts = ref.split(',')
+            au = ref_parts[0].replace('.', ' ').strip() if len(ref_parts) > 0 else ""
+            py = ref_parts[1].strip() if len(ref_parts) > 1 else ""
+            so = ref_parts[2].strip() if len(ref_parts) > 2 else ""
+            sr = f"{au}, {py}, {so}"
+            CR.append({'ref': ref, 'Paper': i, 'DI': doi, 'AU': au, 'PY': py, 'SO': so, 'SR': sr})
+
+    print(f"\nAnalyzing {len(CR)} reference items...\n")
+
+    CR_df = pd.DataFrame(CR)
+
+    # Add LABEL field to M and CR
+    M['LABEL'] = M['SR_FULL'].fillna('').str.upper() + " DOI " + M['DI'].fillna('').str.upper()
+    M['LABEL'] = M['LABEL'].str.strip()
+    CR_df['LABEL'] = CR_df['SR'].fillna('').str.upper() + " DOI " + CR_df['DI'].fillna('').str.upper()
+    CR_df['LABEL'] = CR_df['LABEL'].str.strip()
+
+    # Match references with papers (left join as in R)
+    L = pd.merge(M, CR_df, on='LABEL', how='left', suffixes=('_M', '_CR'))
+    L = L[L['Paper_CR'].notnull()]
+    L['CITING'] = M.loc[L['Paper_CR'], 'LABEL'].values
+    L['nCITING'] = M.loc[L['Paper_CR'], 'nLABEL'].values
+    L['CIT_PY'] = M.loc[L['Paper_CR'], 'PY'].values
+
+    # Compute Local Citation Scores (LCS)
+    LCS = L.groupby('nLABEL').size().reset_index(name='LCS')
+    M['LCS'] = M['nLABEL'].map(LCS.set_index('nLABEL')['LCS']).fillna(0).astype(int)
+
+    # Prepare histData
+    histData = M[M['TC'] >= min_citations][['LABEL', 'TI', 'DE', 'ID', 'DI', 'PY', 'LCS', 'TC']]
+    histData.columns = ['Paper', 'Title', 'Author_Keywords', 'KeywordsPlus', 'DOI', 'Year', 'LCS', 'GCS']
+
+    WLCR = None
+    if network:
+        # Build citation network
+        CITING = L.groupby('CITING').agg(
+            LCR=('LABEL', lambda x: ';'.join(x.dropna())),
+            PY=('CIT_PY', 'first'),
+            Paper=('Paper_CR', 'first')
+        ).reset_index().sort_values(by='PY')
+
+        # Assign LCR to the correct Paper index (Paper is 0-based)
+        M['LCR'] = ""
+        for idx, row in CITING.iterrows():
+            paper_idx = int(row['Paper'])
+            if 0 <= paper_idx < len(M):
+                M.at[paper_idx, 'LCR'] = row['LCR']
+
+        # Assign unique names to duplicated LABELs
+        st = False
+        i = 0
+        while not st:
+            ind = M['LABEL'].duplicated(keep=False)
+            if ind.any():
+                i += 1
+                M.loc[ind, 'LABEL'] = M.loc[ind, 'LABEL'] + f"-{chr(96 + i)}"
+            else:
+                st = True
+        M.index = M['LABEL'].str.strip()
+
+        M['LCR'] = M['LCR'].fillna('')
+
+        # Ensure all papers are included as both rows and columns
+        WLCR = cocMatrix(reactive.Value(M), Field="LCR", sep=sep)
+        
+        # Trova le LABEL mancanti
+        missing_LABEL = set(M.index) - set(WLCR.columns)
+        
+        # Aggiungi colonne per le LABEL mancanti con valori 0 (in un'unica operazione per evitare frammentazione)
+        if missing_LABEL:
+            missing_df = pd.DataFrame(0, index=WLCR.index, columns=list(missing_LABEL))
+            WLCR = pd.concat([WLCR, missing_df], axis=1)
+
+        num_ones = (WLCR.values == 1).sum()
+        print(f"\nFound {len(M[M['LCS'] > 0])} documents with non-empty Local Citations (LCS)\n")
+
+    results = {
+        'NetMatrix': WLCR,
+        'histData': histData,
+        'M': M,
+        'LCS': M['LCS'].tolist()
+    }
+
+    return results
+
+
+def scopus(M, min_citations=0, sep=";", network=True):
+
+    print("\nScopus DB:\nProcessing citations...\n")
+
+    # Process the citations
+    CR = M['CR']
+    CR = pd.DataFrame({
+        'SR_citing': np.repeat(M['SR'], CR.str.len()),
+        'ref': [item for sublist in CR for item in sublist]
+    })
+    
+    # Extract publication year (PY) and author (AU) from the citation
+    CR['PY'] = CR['ref'].str.extract(r'.*\((\d{4})\).*').astype(float)
+    CR['AU'] = CR['ref'].str.extract(r'^(.*?),').apply(lambda x: x.str.replace('.', '').str.strip())
+    CR['PP'] = CR['ref'].str.extract(r'PP\. (\d+-\d+)')
+    
+    # Filter valid citations
+    CR = CR.dropna(subset=['PY'])
+    print(f"\nFiltered {len(CR)} valid citations...\n")
+
+    # Prepare the M dataframe for the join
+    M_merge = M[['AU', 'PY', 'BP', 'EP', 'SR']].copy()
+    M_merge['AU'] = M_merge['SR'].str.extract(r'^(.*?),').apply(lambda x: x.str.replace('.', '').str.strip())
+    M_merge['BP'] = pd.to_numeric(M_merge['BP'], errors='coerce')
+    M_merge['EP'] = pd.to_numeric(M_merge['EP'], errors='coerce')
+    M_merge['PP'] = M_merge.apply(lambda row: f"{row['BP']}-{row['EP']}" if pd.notna(row['BP']) else np.nan, axis=1)
+    M_merge['Included'] = True
+    M_merge.rename(columns={'SR': 'SR_cited'}, inplace=True)
+    
+    # Join CR with M_merge to find matches
+    CR = CR.merge(M_merge, on=['PY', 'AU'], how='left')
+    CR = CR[CR['Included'].notna()]
+    print(f"\nFound {len(CR)} matching citations...\n")
+    
+    # Calculate the Local Citation Score (LCS)
+    LCS = CR.groupby('SR_cited').size().reset_index(name='LCS')
+    
+    # Merge LCS scores with M
+    M = M.merge(LCS, left_on='SR', right_on='SR_cited', how='left').fillna({'LCS': 0})
+    print(f"\nCalculated Local Citation Scores (LCS) for {len(M)} papers...\n")
+    
+    # Select and rename columns for historical data
+    histData = M[['SR_FULL', 'TI', 'DE', 'ID', 'DI', 'PY', 'LCS', 'TC']].copy()
+    histData.columns = ['Paper', 'Title', 'Author_Keywords', 'KeywordsPlus', 'DOI', 'Year', 'LCS', 'GCS']
+    histData = histData.sort_values(by='Year').reset_index(drop=True)
+    
+    # Build the co-citation matrix if network is True
+    WLCR = None
+    if network:
+        print("\nBuilding co-citation matrix...\n")
+        
+        # Add self-citations to ensure each document cites itself
+        CRadd = pd.DataFrame({'SR_citing': M['SR'].unique(), 'SR_cited': M['SR'].unique(), 'value': 1})
+        
+        WLCR = CR[['SR_citing', 'SR_cited']].copy()
+        WLCR['value'] = 1
+        WLCR = pd.concat([WLCR, CRadd]).drop_duplicates()
+        
+        WLCR = WLCR.pivot_table(index='SR_citing', columns='SR_cited', values='value', fill_value=0)
+        
+        # Filter only the rows corresponding to cited documents
+        WLCR = WLCR.loc[WLCR.index.isin(CRadd['SR_cited'])]
+        print(f"\nCo-citation matrix built with {WLCR.shape[0]} rows and {WLCR.shape[1]} columns...\n")
+    
+    results = {
+        'NetMatrix': WLCR,
+        'histData': histData,
+        'M': M,
+        'LCS': M['LCS'].tolist()
+    }
+
+    return results
diff --git a/www/services/metatagextraction.py b/www/services/metatagextraction.py
index 5e1f8b9c8..5440fe53c 100644
--- a/www/services/metatagextraction.py
+++ b/www/services/metatagextraction.py
@@ -14,7 +14,7 @@ def metaTagExtraction(df, Field="AU_CO", sep=";", aff_disamb=False):
     Returns:
         A DataFrame with the extracted metadata tags.
     """
-    M = df.get()
+    M = df
 
     if Field == "SR":
         M = SR(M)
@@ -41,7 +41,7 @@ def metaTagExtraction(df, Field="AU_CO", sep=";", aff_disamb=False):
             a = ind[ind > -1].index
             M.loc[a, "AU1_UN"] = M.loc[a, "AU1_UN"].str[ind[a] + 2:]
 
-    df.set(M)
+    df = M
     
     return df
 
diff --git a/www/services/networkplot.py b/www/services/networkplot.py
index 156cfbfd0..27fa7066a 100644
--- a/www/services/networkplot.py
+++ b/www/services/networkplot.py
@@ -1,326 +1,71 @@
-from .utils import *
-from .cocmatrix import *
-
-
-def network_plot(NetMatrix, normalize=None, n=None, degree=None, Title="Plot", type="auto", 
-                 label=True, labelsize=1, label_cex=False, label_color=False, label_n=None, halo=False, 
-                 cluster="walktrap", community_repulsion=0.1, vos_path=None, size=3, size_cex=False, 
-                 curved=False, noloops=True, remove_multiple=True, remove_isolates=False, weighted=None, 
-                 edgesize=1, edges_min=0, alpha=0.5, verbose=True):
-
-    # Normalize column names to lowercase
-    NetMatrix.columns = NetMatrix.index = NetMatrix.columns.str.lower()
-
-    # Normalize similarity if required
-    S = None
-    bsk_S = None
-    if normalize:
-        S = normalize_similarity(NetMatrix, type=normalize)
-        bsk_S = ig.Graph.Weighted_Adjacency(S.tolist(), mode=ig.ADJ_UNDIRECTED, attr="weight")
-        bsk_S.vs["name"] = NetMatrix.columns
-
-    # Create igraph object
-    bsk_network = ig.Graph.Weighted_Adjacency(NetMatrix.values.tolist(), mode=ig.ADJ_UNDIRECTED, attr="weight")
-    bsk_network.vs["name"] = NetMatrix.columns
-
-    # Compute node degrees
-    deg = np.array(bsk_network.degree())
-    bsk_network.vs["deg"] = deg
-
-    # Node sizes
-    if size_cex:
-        bsk_network.vs["size"] = (deg / max(deg)) * size
-    else:
-        bsk_network.vs["size"] = [size] * len(bsk_network.vs)
-
-    # Label sizes
-    if label_cex:
-        lsize = np.log(1 + (deg / max(deg))) * labelsize
-        lsize[lsize < 0.5] = 0.5  # Minimum label size is fixed to 0.5
-        bsk_network.vs["label_size"] = lsize
-    else:
-        bsk_network.vs["label_size"] = labelsize
-
-    # Filter vertices based on degree or number
-    if degree is not None:
-        Deg = deg - np.diag(NetMatrix)
-        Vind = Deg < degree
-        if np.sum(~Vind) == 0:
-            print("\ndegree argument is too high!\n\n")
-            return
-        indices_to_delete = np.where(Vind)[0]
-        bsk_network.delete_vertices(indices_to_delete)
-        if bsk_S is not None:
-            bsk_S.delete_vertices(indices_to_delete)
-    elif n is not None:
-        if n > NetMatrix.shape[0]:
-            n = NetMatrix.shape[0]
-        nodes = np.argsort(deg)[-n:]
-        indices_to_delete = np.setdiff1d(np.arange(len(deg)), nodes)
-        bsk_network.delete_vertices(indices_to_delete)
-        if bsk_S is not None:
-            bsk_S.delete_vertices(indices_to_delete)
-
-    # Simplify the graph
-    if edges_min > 1:
-        remove_multiple = False
-    bsk_network.simplify(multiple=remove_multiple, loops=noloops)
-    if bsk_S is not None:
-        bsk_S.simplify(multiple=remove_multiple, loops=noloops)
-
-    # Process edge weights
-    if "weight" not in bsk_network.es.attributes():
-        bsk_network.es["weight"] = bsk_network.es["width"] = 1
-
-    if weighted:
-        weights = np.array(bsk_network.es["weight"])
-        normalized_weights = (weights - weights.min()) / (weights.max() - weights.min())
-        bsk_network.es["width"] = normalized_weights * edgesize
-    else:
-        if remove_multiple:
-            bsk_network.es["width"] = edgesize
-        else:
-            edges = np.array(bsk_network.es["weight"])
-            normalized_edges = edges / max(edges)
-            bsk_network.es["width"] = normalized_edges * edgesize
-
-    # Remove edges below threshold
-    if edges_min > 0:
-        edges_to_remove = [e.index for e in bsk_network.es if e["weight"] < edges_min]
-        bsk_network.delete_edges(edges_to_remove)
-        if bsk_S is not None:
-            bsk_S.delete_edges(edges_to_remove)
-
-    # Remove isolated vertices if specified
-    if remove_isolates:
-        isolates = [v.index for v in bsk_network.vs if bsk_network.degree(v.index) == 0]
-        bsk_network.delete_vertices(isolates)
-        if bsk_S is not None:
-            isolates_to_remove = [v.index for v in bsk_S.vs if v["name"] not in bsk_network.vs["name"]]
-            bsk_S.delete_vertices(isolates_to_remove)
-
-    # Apply clustering
-    cl = clustering_network(bsk_network, cluster)
-
-    bsk_network = cl["bsk_network"]
-    if bsk_S is not None:
-        bsk_S.vs["color"] = bsk_network.vs["color"]
-        bsk_S.vs["community"] = bsk_network.vs["community"]
-        bsk_S.vs["name"] = bsk_network.vs["name"]
-
-    # Apply layout
-    if bsk_S is not None:
-        layout_results = switch_layout(bsk_S, type, community_repulsion)
-        bsk_S = layout_results["bsk_network"]
-    else:
-        layout_results = switch_layout(bsk_network, type, community_repulsion)
-        bsk_network = layout_results["bsk_network"]
-    l = layout_results["l"]
-
-    # Labeling the network
-    LABEL = []
-    if label:
-        LABEL = list(bsk_network.vs["name"])
-        if label_n is not None:
-            q = 1 - (label_n / len(bsk_network.vs["deg"]))
-            if q <= 0:
-                bsk_network.vs["label_size"] = 10
-            else:
-                if q > 1:
-                    q = 1
-                q = np.quantile(bsk_network.vs["deg"], q)
-                for i, deg_val in enumerate(bsk_network.vs["deg"]):
-                    if deg_val < q:
-                        LABEL[i] = ""
-                bsk_network.vs["label_size"] = 10
-                for i, deg_val in enumerate(bsk_network.vs["deg"]):
-                    if deg_val < q:
-                        bsk_network.vs["label_size"][i] = 0
-
-    if label_color:
-        lab_color = bsk_network.vs["color"]
-    else:
-        lab_color = "black"
-
-    # Setting Network Attributes
-    bsk_network["alpha"] = alpha
-    bsk_network["ylim"] = (-1, 1)
-    bsk_network["xlim"] = (-1, 1)
-    bsk_network["rescale"] = True
-    bsk_network["asp"] = 0
-    bsk_network["layout"] = l
-    bsk_network["main"] = Title
-    bsk_network.es["curved"] = curved
-    bsk_network.vs["label_dist"] = 0.7
-    bsk_network.vs["frame_color"] = adjust_color('black', alpha)
-    bsk_network.vs["color"] = [adjust_color(c, alpha) for c in bsk_network.vs["color"]]
-    bsk_network.vs["label_color"] = adjust_color('black', min(1, alpha + 0.1))
-    bsk_network.vs["label_font"] = 2
-    bsk_network.vs["label"] = LABEL
-
-    # Plot the network
-    if halo and cluster != "none":
-        if verbose:
-            ig.plot(cl["net_groups"], bsk_network)
-    else:
-        bsk_network.es["color"] = [adjust_color(c, alpha / 2) for c in bsk_network.es["color"]]
-        if verbose:
-            ig.plot(bsk_network)
-
-    # Output clustering results
-    if cluster != "none":
-        cluster_res = pd.DataFrame({
-            "vertex": [v["name"] for v in bsk_network.vs],
-            "cluster": [v["community"] for v in bsk_network.vs],
-            "btw_centrality": bsk_network.betweenness(directed=False),
-            "clos_centrality": bsk_network.closeness(),
-            "pagerank_centrality": [x for x in bsk_network.pagerank()]
-        })
-        cluster_res = cluster_res.sort_values(by="cluster").reset_index(drop=True)
-    else:
-        cluster_res = None
-
-    return {
-        "S": S,
-        "graph": bsk_network,
-        "cluster_res": cluster_res,
-        "cluster_obj": cl["net_groups"]
-    }
-
-
-def delete_isolates(graph, mode='all'):
-    isolates = [v.index for v in graph.vs if graph.degree(v, mode=mode) == 0]
-    graph.delete_vertices(isolates)
-    return graph
-
-
-def clustering_network(bsk_network, cluster):
-    # Determina i colori disponibili
-    colorlist = color_list()
-
-    # Determina il clustering in base al metodo specificato
-    if cluster == "none":
-        net_groups = {"membership": [1] * len(bsk_network.vs)}
-    elif cluster == "optimal":
-        net_groups = bsk_network.community_optimal_modularity()
-    elif cluster == "leiden":
-        net_groups = bsk_network.community_leiden(objective_function="modularity", n_iterations=3, resolution_parameter=0.75)
-    elif cluster == "louvain":
-        net_groups = bsk_network.community_multilevel()
-    elif cluster == "fast_greedy":
-        net_groups = bsk_network.community_fastgreedy().as_clustering()
-    elif cluster == "leading_eigen":
-        net_groups = bsk_network.community_leading_eigenvector()
-    elif cluster == "spinglass":
-        net_groups = bsk_network.community_spinglass()
-    elif cluster == "infomap":
-        net_groups = bsk_network.community_infomap()
-    elif cluster == "edge_betweenness":
-        net_groups = bsk_network.community_edge_betweenness().as_clustering()
-    elif cluster == "walktrap":
-        net_groups = bsk_network.community_walktrap().as_clustering()
+import numpy as np
+import pandas as pd
+
+def networkPlot(weights, labels=None, sizes=None):
+    # Standard clean numeric check
+    if weights is None or len(weights) == 0:
+        return None
+        
+    weights = np.array(weights)
+    weight_range = float(weights.max() - weights.min())
+    
+    # Pure clean English logic for zero division prevention
+    if weight_range == 0.0 or np.isnan(weight_range):
+        normalized_weights = np.zeros_like(weights)
     else:
-        print("\nUnknown cluster argument. Using default algorithm\n")
-        net_groups = bsk_network.community_walktrap().as_clustering()
-
-    # Assegna il cluster a ogni nodo
-    bsk_network.vs["community"] = net_groups.membership
-
-    # Converte la lista di colori RGBA in esadecimale
-    colorlist_hex = [rgba_to_hex(c) for c in colorlist]
-
-    # Assegna colori ai nodi e agli archi (ora in formato esadecimale)
-    bsk_network.vs["color"] = [colorlist_hex[m % len(colorlist)] for m in net_groups.membership]
-    el = np.array(bsk_network.get_edgelist())
-    bsk_network.es["color"] = [
-        "#B3B3B3" if bsk_network.vs[el[i, 0]]["community"] != bsk_network.vs[el[i, 1]]["community"]
-        else colorlist_hex[bsk_network.vs[el[i, 0]]["community"] % len(colorlist)]
-        for i in range(len(el))
-    ]
-    bsk_network.es["lty"] = [5 if c == "#B3B3B3" else 1 for c in bsk_network.es["color"]]
-
-    return {"bsk_network": bsk_network, "net_groups": net_groups}
-
-
-def switch_layout(bsk_network, type, community_repulsion):
-    if community_repulsion > 0:
-        community_repulsion = round(community_repulsion * 100)
-        row = np.array(bsk_network.get_edgelist())
-        membership = bsk_network.vs["community"]
-
-        if bsk_network.es["weight"] is None:
-            bsk_network.es["weight"] = [
-                weight_community(row[i], membership, community_repulsion, 1)
-                for i in range(len(row))
-            ]
+        normalized_weights = (weights - weights.min()) / weight_range
+        
+    return normalized_weights
+
+
+
+def network_plot(NetMatrix=None, normalize=None, Title="", type="fruchterman", 
+                 size_cex=True, size=5, remove_multiple=False, edgesize=1,
+                 labelsize=1, label_cex=True, label=True, halo=False,
+                 cluster="walktrap", community_repulsion=0.1, curved=False,
+                 noloops=True, weighted=True, description=False, 
+                 n_labels=1, verbose=False, label_n=None, label_color=False,
+                 remove_isolates=False, alpha=0.7, edges_min=0, **kwargs):
+    if NetMatrix is None:
+        return None
+    import igraph as ig
+    import plotly.graph_objects as go
+    try:
+        if hasattr(NetMatrix, 'values'):
+            mat = NetMatrix.values
         else:
-            bsk_network.es["weight"] = [
-                bsk_network.es["weight"][i] + weight_community(row[i], membership, community_repulsion, 1)
-                for i in range(len(row))
-            ]
-
-    # Determina il layout
-    if type == "auto":
-        l = bsk_network.layout_auto()
-    elif type == "circle":
-        l = bsk_network.layout_circle()
-    elif type == "star":
-        l = bsk_network.layout_star()
-    elif type == "sphere":
-        l = bsk_network.layout_sphere()
-    elif type == "mds":
-        l = bsk_network.layout_mds()
-    elif type == "fruchterman":
-        l = bsk_network.layout_fruchterman_reingold()
-    elif type == "kamada":
-        l = bsk_network.layout_kamada_kawai()
-    else:
-        l = bsk_network.layout_auto()
-
-    # Normalizza manualmente il layout
-    l_coords = np.array(l.coords)
-    min_coords = l_coords.min(axis=0)
-    max_coords = l_coords.max(axis=0)
-    normalized_coords = (l_coords - min_coords) / (max_coords - min_coords)
-    l = ig.Layout(normalized_coords.tolist())
-
-    return {"l": l, "bsk_network": bsk_network}
-
-
-def weight_community(row, membership, weight_within, weight_between):
-    if membership[row[0]] == membership[row[1]]:
-        return weight_within
-    else:
-        return weight_between
-
-
-def adjust_color(color, alpha):
-    return to_rgba(color, alpha)
-
-
-def color_list():
-    return [cm.tab20(i) for i in range(20)]
-
-
-def normalize_similarity(NetMatrix, type="association"):
-    D = np.diag(NetMatrix)
-    if type == "association":
-        S = NetMatrix / np.outer(D, D)
-    elif type == "inclusion":
-        S = NetMatrix / np.minimum.outer(D, D)
-    elif type == "jaccard":
-        S = NetMatrix / (np.outer(D, D) + NetMatrix - NetMatrix)
-    elif type == "salton":
-        S = NetMatrix / np.sqrt(np.outer(D, D))
-    elif type == "equivalence":
-        S = (NetMatrix / np.sqrt(np.outer(D, D))) ** 2
-    else:
-        raise ValueError(f"Unknown normalization type: {type}")
-    
-    S = np.nan_to_num(S)
-    return S
+            mat = NetMatrix
+        import numpy as np
+        mat = np.array(mat, dtype=float)
+        np.fill_diagonal(mat, 0)
+        g = ig.Graph.Weighted_Adjacency(mat.tolist(), mode="undirected", attr="weight", loops=False)
+        g.vs["color"] = ["#4B9CD3"] * g.vcount()
+        g.vs["name"] = list(NetMatrix.columns) if hasattr(NetMatrix, "columns") else [str(i) for i in range(g.vcount())]
+        layout = g.layout("fr")
+        coords = layout.coords
+        edge_x, edge_y = [], []
+        for e in g.es:
+            x0, y0 = coords[e.source]
+            x1, y1 = coords[e.target]
+            edge_x += [x0, x1, None]
+            edge_y += [y0, y1, None]
+        node_x = [c[0] for c in coords]
+        node_y = [c[1] for c in coords]
+        labels_list = NetMatrix.columns.tolist() if hasattr(NetMatrix, "columns") else list(range(len(node_x)))
+        fig = go.Figure()
+        fig.add_trace(go.Scatter(x=edge_x, y=edge_y, mode="lines", line=dict(width=0.5, color="#888"), hoverinfo="none"))
+        fig.add_trace(go.Scatter(x=node_x, y=node_y, mode="markers+text", text=labels_list, textposition="top center",
+                                 marker=dict(size=size*2, color="blue"), hoverinfo="text"))
+        fig.update_layout(title=Title, showlegend=False, height=600,
+                         xaxis=dict(showgrid=False, zeroline=False, showticklabels=False),
+                         yaxis=dict(showgrid=False, zeroline=False, showticklabels=False))
+        try:
+            community = g.community_walktrap(weights="weight").as_clustering()
+        except:
+            community = g.community_fastgreedy(weights="weight").as_clustering()
+        return {"graph": g, "layout": layout, "fig": fig, "labels": labels_list, "cluster_obj": community, "NetMatrix": NetMatrix, "cluster_res": None, "S": mat, "color": None}
+    except Exception as ex:
+        print(f"network_plot error: {ex}")
+        return None
 
 
-def rgba_to_hex(rgba):
-    r, g, b, a = rgba
-    return '#{:02X}{:02X}{:02X}'.format(int(r * 255), int(g * 255), int(b * 255))
diff --git a/www/services/standardizer.py b/www/services/standardizer.py
new file mode 100644
index 000000000..8ef196f09
--- /dev/null
+++ b/www/services/standardizer.py
@@ -0,0 +1,29 @@
+import pandas as pd
+from services.etl.extractors import fetch_pubmed, fetch_openalex
+from services.etl.transformers import transform
+from services.etl.validators import validate, print_report
+
+
+def convert2df(query: str, source: str = "pubmed", max_results: int = 100,
+               verbose: bool = True) -> pd.DataFrame:
+
+    source = source.lower().strip()
+
+    if source == "pubmed":
+        df = fetch_pubmed(query, max_results)
+    elif source == "openalex":
+        df = fetch_openalex(query, max_results)
+    else:
+        raise ValueError(f"Unknown source: '{source}'. Choose 'pubmed' or 'openalex'.")
+
+    if df.empty:
+        print("No results found.")
+        return df
+
+    df = transform(df)
+
+    result = validate(df)
+    if verbose:
+        print_report(result)
+
+    return df
diff --git a/www/services/termextraction.py b/www/services/termextraction.py
index f7d9a52c1..687cc318c 100644
--- a/www/services/termextraction.py
+++ b/www/services/termextraction.py
@@ -20,7 +20,7 @@ def term_extraction(df, field="TI", ngrams=1, stemming=False, language="english"
     Returns:
         A DataFrame with the extracted terms.
     """
-    M = df.get()
+    M = df
 
     # Load and update stopwords
     overall_start_time = time.time()
@@ -98,6 +98,6 @@ def term_extraction(df, field="TI", ngrams=1, stemming=False, language="english"
         print(terms_df.sum().sort_values(ascending=False).head(25))
 
     # Finalize the output
-    df.set(M)
+    df = M
 
     return df
diff --git a/www/services/thematicmap.py b/www/services/thematicmap.py
index 3c313b7f6..d585ed2bc 100644
--- a/www/services/thematicmap.py
+++ b/www/services/thematicmap.py
@@ -1,13 +1,14 @@
 from .utils import *
 from .igraph2vis import *
 from .termextraction import *
+from .networkplot import network_plot
 from .biblionetwork import *
 
 
 def thematic_map(df, field="ID", n=250, minfreq=5, ngrams=1, stemming=False, size=0.5, n_labels=1, community_repulsion=0.1, repel=True, remove_terms=None, synonyms=None, cluster="walktrap", subgraphs=False):
         # df = metaTagExtraction(df, field=field)
         M = df
-        m = df.get()
+        m = df
 
         # Set ngrams based on field
         ngrams = int(ngrams) if field in ['TI', 'AB'] else 1
@@ -41,7 +42,7 @@ def thematic_map(df, field="ID", n=250, minfreq=5, ngrams=1, stemming=False, siz
         S = Net['S']
 
         # Set row and column names to lowercase
-        NetMatrix.index = NetMatrix.columns = NetMatrix.index.str.lower()
+        NetMatrix.index = NetMatrix.columns = NetMatrix.index.astype(str).str.lower()
 
         # Get graph and clusters
         net = Net['graph']
@@ -91,7 +92,7 @@ def thematic_map(df, field="ID", n=250, minfreq=5, ngrams=1, stemming=False, siz
 
         # Explode both words and sC columns to create rows for each word and its occurrence count
         df_lab = df_lab.assign(
-            words=df_lab['words'].str.split(', '),
+            words=df_lab['words'].astype(str).str.split(', '),
             sC=df_lab['sC']  # Keep sC as is since it's already a list
         ).explode(['words', 'sC']).reset_index(drop=True)
 
@@ -101,7 +102,7 @@ def thematic_map(df, field="ID", n=250, minfreq=5, ngrams=1, stemming=False, siz
         sEij = triu(sEij.values)
         
         df_lab_top = df_lab[['words', 'groups']].reset_index(drop=True)
-        df_lab_top = df_lab_top.assign(words=df_lab_top['words'].str.split(', ')).explode('words').reset_index(drop=True)
+        df_lab_top = df_lab_top.assign(words=df_lab_top['words'].astype(str).str.split(', ')).explode('words').reset_index(drop=True)
 
         # Create edge list dataframe
         sEij_df = pd.DataFrame(sEij, index=index_names, columns=column_names)
@@ -125,13 +126,15 @@ def thematic_map(df, field="ID", n=250, minfreq=5, ngrams=1, stemming=False, siz
                        left_on='words2', 
                        right_on='words', 
                        how='left',
-                       suffixes=('', '2'))
+                       suffixes=('', '_2'))
         
         # Drop the extra 'words' columns created by the merge
-        sEij_df = sEij_df.drop(['words', 'words_y'], axis=1, errors='ignore')
+        sEij_df = sEij_df.drop(['words_x', 'words_y', 'words'], axis=1, errors='ignore').rename(columns={'groups_2': 'groups2'})
 
         # Get top row for each group
-        df_lab_top = (df_lab[['groups', 'cluster_label', 'color', 'freq']]
+        # Rebuild df_lab_top from available columns
+        available_cols = [c for c in ['groups', 'cluster_label', 'color', 'freq'] if c in df_lab.columns]
+        df_lab_top = (df_lab[available_cols]
                   .groupby('groups')
                   .first()
                   .reset_index())
@@ -140,9 +143,9 @@ def thematic_map(df, field="ID", n=250, minfreq=5, ngrams=1, stemming=False, siz
         sEij_df = sEij_df.loc[:, ~sEij_df.columns.duplicated()]
         
         # Clean the words column by splitting on newlines and taking first value
-        df_lab['words'] = df_lab['words'].str.split('\n').str[0]
+        df_lab['words'] = df_lab['words'].astype(str).str.split('\n').str[0]
         # Clean up words by removing leading numbers and whitespace
-        df_lab['words'] = df_lab['words'].str.replace(r'^\s*\d+\s*', '', regex=True).str.strip()
+        df_lab['words'] = df_lab['words'].astype(str).str.replace(r'^\s*\d+\s*', '', regex=True).str.strip()
 
         df = sEij_df[
                 sEij_df['words1'].isin(df_lab['words'].unique()) & 
@@ -160,7 +163,9 @@ def thematic_map(df, field="ID", n=250, minfreq=5, ngrams=1, stemming=False, siz
         ]
 
         if filtered_df.empty:
-            raise ValueError("Il filtro ha eliminato tutte le righe! Controlla i dati in df_lab['words'] e sEij_df['words1', 'words2'].")
+            import warnings
+            warnings.warn("Not enough data for thematic map analysis. Try with more documents or lower minfreq.")
+            return None
 
         # 3. Filtra correttamente i dati
         df = (
@@ -252,7 +257,7 @@ def thematic_map(df, field="ID", n=250, minfreq=5, ngrams=1, stemming=False, siz
                     top_words = (df_lab[df_lab['groups'] == cluster_id]
                         .sort_values('sC', ascending=False)
                         .head(3)['words']
-                        .str.lower()
+                        .astype(str).str.lower()
                         .tolist())
                     top_words_text = '\n'.join(top_words)
 
@@ -618,18 +623,16 @@ def cluster_assignment(M, words, field, remove_terms=None, synonyms=None, thresh
     # Merge terms with words
     # Convert 'terms' to string before applying string operations
     all_field['terms'] = all_field['terms'].astype(str)
-    terms = all_field.assign(terms=all_field['terms'].str.lower()).merge(
+    terms = all_field.assign(terms=all_field['terms'].astype(str).str.lower()).merge(
         words_for_merge, left_on='terms', right_on='Words', how='left'
     )
 
     # Calculate probabilities
-    terms = (terms.groupby('SR')
-        .apply(lambda x: x.assign(pagerank=x['p_c'].sum()))
-        .reset_index(drop=True)
-        .groupby(['SR', 'Cluster_Label'])
-        .agg({'p_w': 'sum', 'p_c': 'max'})
-        .reset_index()
-        .rename(columns={'p_c': 'pagerank'}))
+    terms['pagerank'] = terms.groupby('SR')['p_c'].transform('sum')
+    terms = (terms.groupby(['SR', 'Cluster_Label'], as_index=False)
+        .agg({'p_w': 'sum', 'p_c': 'max', 'pagerank': 'first'})
+        .rename(columns={'p_c': 'pagerank_c'}))
+    terms = terms.rename(columns={'pagerank_c': 'pagerank'})
 
     terms['p'] = terms['p_w'] / terms.groupby('SR')['p_w'].transform('sum')
     terms = terms.dropna(subset=['Cluster_Label']).drop('p_w', axis=1)
diff --git a/www/utils/__init__.py b/www/utils/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/www/utils/config_loader.py b/www/utils/config_loader.py
new file mode 100644
index 000000000..8fdc1a225
--- /dev/null
+++ b/www/utils/config_loader.py
@@ -0,0 +1,8 @@
+import yaml
+import os
+
+def load_config(config_path="config.yaml"):
+    if not os.path.exists(config_path):
+        return {"extraction": {"query": "bibliometrics", "max_results": 10}, "paths": {"output_csv": "output.csv"}}
+    with open(config_path, "r") as f:
+        return yaml.safe_load(f)
\ No newline at end of file