Check institution frequencies
parent
9416a1c8b6
commit
0549d0f55f
@ -0,0 +1,14 @@
|
||||
#%% Compare the frequency of the inst. names with the wos-analysis on the web interface
import pandas as pd

# %% Read the harmonized institution table
wos_inst_df = pd.read_excel("../wos_processed_data/wos_institution_locations_harmonized.xlsx")

# %% Get rid of the duplicate institution name entries in each individual publication
# De-duplicate on the (institution, publication ID) column pair directly instead of
# building a ";"-joined string key and splitting it again afterwards. The joined key
# becomes NaN as soon as either cell is missing (which makes the later str.split
# fail), raises on non-string cells, and truncates any institution name that itself
# contains ";".
# NOTE(review): rows with a missing publication ID are treated as belonging to one
# and the same publication by drop_duplicates — confirm that is acceptable.
wos_pubunique_inst = wos_inst_df.drop_duplicates(
    subset=["Institution", "UT (Unique WOS ID)"]
)["Institution"]

# %% Calc. frequencies, and get an output
# DataFrame.value_counts() skips missing institution names by default and returns
# the counts in descending order.
wos_inst_freqdf = (
    wos_pubunique_inst.to_frame()
    .value_counts()
    .rename_axis("institution")
    .reset_index(name="frequency")
)
wos_inst_freqdf.to_csv("../wos_processed_data/wos_pubunique-institution_frequency.csv", index=False)
|
Binary file not shown.
|
Binary file not shown.
Loading…
Reference in New Issue