This file contains ambiguous Unicode characters that may be confused with others in your current locale. If your use case is intentional and legitimate, you can safely ignore this warning. Use the Escape button to highlight these characters.
"# return \"; \".join([i[0].upper() for i in keywords])\n",
"#\n",
"# kwd_extract(text=\"Artificial Intelligence: New Frontiers in Real-Time Inverse Scattering and Electromagnetic Imaging - In recent years, artificial intelligence (AI) techniques have been developed rapidly. With the ...\")"
"text/plain": " UT (Unique WOS ID) Country Country_Type \n0 WOS:000208863600266 China China \\\n6 WOS:000209236900010 China China \n7 WOS:000209236900010 China China \n8 WOS:000209236900010 France EU \n10 WOS:000209236900010 Germany EU \n... ... ... ... \n321236 WOS:000953367000001 China China \n321237 WOS:000953367000001 China China \n321238 WOS:000953367000001 China China \n321239 WOS:000953367000001 China China \n321241 WOS:000953367000001 United Kingdom Non-EU associate \n\n author_str_id \n0 5dfb4f0408a2cc8b7f36f5516938b62c \n6 b406b8485c286091a46aca4999f294d3 \n7 abf37b879540b7c2eeb86787a467de29 \n8 2c559a54c654ab6dbc23d20ae82a0501 \n10 2c559a54c654ab6dbc23d20ae82a0501 \n... ... \n321236 99ef5c82ba66e07f9aa2d3f9fc7c45f7 \n321237 d013bf53d094540f90db9224b3eb9922 \n321238 702962f6fe47bac08520ae556a8e0e02 \n321239 99ef5c82ba66e07f9aa2d3f9fc7c45f7 \n321241 9cc42be570a5464bca0ea4b6b39d0271 \n\n[277884 rows x 4 columns]",
"text/plain": " UT (Unique WOS ID) Country Country_Type \n0 WOS:000208863600266 China China \\\n299168 WOS:000840488600001 China China \n299169 WOS:000840488600001 China China \n101376 WOS:000434663200012 China China \n101374 WOS:000434663200012 China China \n\n author_str_id \n0 5dfb4f0408a2cc8b7f36f5516938b62c \n299168 3462304c908993a828cdd0ff91ea4aaa \n299169 68ab59c442eb882af13a8273439cf840 \n101376 304c36b8b677f41a489894dc66a8461c \n101374 c04795fe195dcadb58bed5c81125ea35 ",
"text/plain": "Affiliations\nCHINESE ACADEMY OF SCIENCES 2688\nUNIVERSITY OF LONDON 1251\nUDICE-FRENCH RESEARCH UNIVERSITIES 1038\nCENTRE NATIONAL DE LA RECHERCHE SCIENTIFIQUE (CNRS) 978\nTSINGHUA UNIVERSITY 960\n ... \nITALIAN INSTITUTE FOR GENOMIC MEDICINE (IIGM) 1\nSHENYANG INSTITUTE OF ENGINEERING 1\nXIANYANG NORMAL UNIVERSITY 1\nAGILENT TECHNOLOGIES 1\nUNIVERSIDAD DE ESPECIALIDADES ESPIRITU SANTO 1\nName: count, Length: 6117, dtype: int64"
},
"execution_count": 67,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"affiliations[\"Affiliations\"].value_counts()"
],
"metadata": {
"collapsed": false
}
},
{
"cell_type": "code",
"execution_count": 68,
"outputs": [
{
"data": {
"text/plain": "Institution\n Chinese Acad Sci 2708\n Tsinghua Univ 1170\n Shanghai Jiao Tong Univ 978\n Zhejiang Univ 902\n Univ Chinese Acad Sci 753\n ... \n Univ Namur 1\n Qianhai Inst Innovat Res 1\n UN 1\n Vienna Int Ctr 1\n Engn Res Ctr Urban Underground Space Dev Zhejiang 1\nName: count, Length: 11670, dtype: int64"
"mode_final.columns = [\"Affiliations\",\"Institution (short name from address)\",\"Country_candidate\",\"City_candidate\",\"Country_type_candidate\"]\n",
"# group = ['Publication Year','Domain_English']\n",
"# data = wos.groupby(group, as_index=False)[record_col].nunique().sort_values(ascending=False, by=group+[record_col])\n",
"# data"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"# group = ['Publication Year','Domain_English']\n",
"# data = wos.groupby(group)[record_col].nunique().unstack(fill_value=0).stack().reset_index().rename(columns={0:record_col}).sort_values(ascending=False, by=group+[record_col])\n",