{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": { "collapsed": true }, "outputs": [], "source": [ "import os\n", "import pandas as pd\n", "import janitor\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "from matplotlib.ticker import MaxNLocator\n", "import math\n", "%matplotlib inline" ] }, { "cell_type": "code", "execution_count": 3, "outputs": [], "source": [ "# Directory holding the scoped CSV extracts read below.\n", "outdir = \"WESTERN_CH_scope\"\n", "\n", "# Each extract is loaded into its own DataFrame.\n", "appln = pd.read_csv(f\"{outdir}/tls_201_scope.csv\")\n", "appln_title = pd.read_csv(f\"{outdir}/tls_202_scope.csv\")\n", "\n", "# Missing psn_sector values are replaced by the literal UNKNOWN at load time.\n", "pers = pd.read_csv(f\"{outdir}/tls_206_scope.csv\").assign(\n", "    psn_sector=lambda frame: frame[\"psn_sector\"].fillna(\"UNKNOWN\")\n", ")\n", "\n", "appln_pers = pd.read_csv(f\"{outdir}/tls_207_scope.csv\")\n", "appln_cpc = pd.read_csv(f\"{outdir}/tls_224_scope.csv\")" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 5, "outputs": [ { "data": { "text/plain": "203873" }, "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ "len(appln)" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 7, "outputs": [ { "data": { "text/plain": " appln_id appln_title_lg \n106316 498640253 en \\\n119852 511974583 en \n193586 577006640 en \n172207 556318748 en \n117620 509549284 en \n... ... ... \n58791 448189845 en \n119362 511604550 en \n73722 471815906 en \n45133 438311946 en \n25978 414431520 en \n\n appln_title \n106316 DRAIN CLEANING DEVICE \n119852 Antenna panel switching and beam indication \n193586 Loft bed \n172207 Winch for Securing a Load \n117620 TEMPERATURE CONTROL APPARATUS FORELECTRIC VEHI... \n... ... \n58791 Collaborative spectrum sensing in cognitive ra... \n119362 CLIP-ON GLASSES WITH REPLACEABLE LENS \n73722 Sensitized, photo-sensitive glass and its prod... \n45133 PREPARATION OF 3,4-DIHYDRO-1,4-BENZOXAZEPIN-5(... \n25978 - CRYSTAL OSCILLATOR WITH LOW-POWER MODE \n\n[100 rows x 3 columns]", "text/html": "
\n | appln_id | \nappln_title_lg | \nappln_title | \n
---|---|---|---|
106316 | \n498640253 | \nen | \nDRAIN CLEANING DEVICE | \n
119852 | \n511974583 | \nen | \nAntenna panel switching and beam indication | \n
193586 | \n577006640 | \nen | \nLoft bed | \n
172207 | \n556318748 | \nen | \nWinch for Securing a Load | \n
117620 | \n509549284 | \nen | \nTEMPERATURE CONTROL APPARATUS FORELECTRIC VEHI... | \n
... | \n... | \n... | \n... | \n
58791 | \n448189845 | \nen | \nCollaborative spectrum sensing in cognitive ra... | \n
119362 | \n511604550 | \nen | \nCLIP-ON GLASSES WITH REPLACEABLE LENS | \n
73722 | \n471815906 | \nen | \nSensitized, photo-sensitive glass and its prod... | \n
45133 | \n438311946 | \nen | \nPREPARATION OF 3,4-DIHYDRO-1,4-BENZOXAZEPIN-5(... | \n
25978 | \n414431520 | \nen | \n- CRYSTAL OSCILLATOR WITH LOW-POWER MODE | \n
100 rows × 3 columns
\n\n | appln_id | \nappln_auth | \nappln_nr | \nappln_kind | \nappln_filing_date | \nappln_filing_year | \nappln_nr_original | \nipr_type | \nreceiving_office | \ninternat_appln_id | \n... | \nearliest_pat_publn_id | \ngranted | \ndocdb_family_id | \ninpadoc_family_id | \ndocdb_family_size | \nnb_citing_docdb_fam | \nnb_applicants | \nnb_inventors | \nappln_title_lg | \nappln_title | \n
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n330225325 | \nEP | \n11150195 | \nA | \n2011-01-05 | \n2011 | \n11150195 | \nPI | \n\n | 0 | \n... | \n335277427 | \nY | \n43754737 | \n330225325 | \n4 | \n16 | \n1 | \n1 | \nen | \nBeverage preparation machine | \n
1 | \n330225397 | \nEP | \n11150231 | \nA | \n2011-01-05 | \n2011 | \n11150231 | \nPI | \n\n | 0 | \n... | \n335277736 | \nY | \n43619902 | \n330225397 | \n6 | \n56 | \n1 | \n9 | \nen | \nScrewdriving tool having a driving tool with a... | \n
2 | \n330322632 | \nEP | \n11150485 | \nA | \n2011-01-10 | \n2011 | \n11150485 | \nPI | \n\n | 0 | \n... | \n364719889 | \nY | \n43991052 | \n330322632 | \n2 | \n5 | \n1 | \n2 | \nen | \nMethod and system for recommending contextual ... | \n
3 | \n330326785 | \nEP | \n11150605 | \nA | \n2011-01-11 | \n2011 | \n11150605 | \nPI | \n\n | 0 | \n... | \n335277720 | \nN | \n43023665 | \n328518903 | \n6 | \n9 | \n1 | \n3 | \nen | \nApparatus and method for continuous casting of... | \n
4 | \n330350961 | \nEP | \n11150683 | \nA | \n2011-01-12 | \n2011 | \n11150683 | \nPI | \n\n | 0 | \n... | \n364923578 | \nN | \n43881056 | \n330350961 | \n7 | \n13 | \n2 | \n5 | \nen | \nA method and an apparatus for treating at leas... | \n
5 rows × 28 columns
\n\n | person_id | \nappln_id | \napplt_seq_nr | \ninvt_seq_nr | \n
---|---|---|---|---|
0 | \n1 | \n340314532 | \n1 | \n0 | \n
1 | \n1 | \n413601768 | \n1 | \n0 | \n
2 | \n21 | \n332015605 | \n1 | \n0 | \n
3 | \n21 | \n333490084 | \n1 | \n0 | \n
4 | \n21 | \n335903805 | \n1 | \n0 | \n
... | \n... | \n... | \n... | \n... | \n
274039 | \n85719932 | \n545918634 | \n0 | \n2 | \n
274040 | \n85720336 | \n569409547 | \n0 | \n4 | \n
274041 | \n85720376 | \n555215896 | \n0 | \n2 | \n
274042 | \n85720469 | \n569304088 | \n0 | \n5 | \n
274043 | \n85720500 | \n569495993 | \n0 | \n5 | \n
274044 rows × 4 columns
\n\n | person_id | \nperson_name | \nperson_name_orig_lg | \nperson_address | \nperson_ctry_code | \nnuts | \nnuts_level | \ndoc_std_name_id | \ndoc_std_name | \npsn_id | \npsn_name | \npsn_level | \npsn_sector | \nhan_id | \nhan_name | \nhan_harmonized | \npsn_sector_primary | \n
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n1 | \nNokia Corporation | \nNokia Corporation | \nKeilalahdentie 4,02150 Espoo | \nFI | \nFI1B1 | \n3 | \n1 | \nNOKIA CORP | \n23782051 | \nNOKIA CORPORATION | \n2 | \nCOMPANY | \n2125445 | \nNOKIA CORP | \n2 | \nCOMPANY | \n
1 | \n128 | \nNokia Siemens Networks Oy | \nNokia Siemens Networks Oy | \nKaraportti 3,02610 Espoo | \nFI | \nFI1B1 | \n3 | \n112 | \nNOKIA SIEMENS NETWORKS OY | \n23782129 | \nNOKIA NETWORKS | \n2 | \nCOMPANY | \n2125445 | \nNOKIA CORP | \n2 | \nCOMPANY | \n
2 | \n5217785 | \nNokia Corporation | \nNokia Corporation | \nEspoo | \nFI | \nFI | \n0 | \n1 | \nNOKIA CORP | \n23782051 | \nNOKIA CORPORATION | \n2 | \nCOMPANY | \n2125445 | \nNOKIA CORP | \n2 | \nCOMPANY | \n
3 | \n5217811 | \nNokia Corporation | \nNokia Corporation | \nNaN | \nFI | \nFI | \n0 | \n1 | \nNOKIA CORP | \n23782051 | \nNOKIA CORPORATION | \n2 | \nCOMPANY | \n2125445 | \nNOKIA CORP | \n2 | \nCOMPANY | \n
4 | \n5232170 | \nNokia Siemens Networks Oy | \nNokia Siemens Networks Oy | \nEspoo | \nFI | \nFI | \n0 | \n112 | \nNOKIA SIEMENS NETWORKS OY | \n23782129 | \nNOKIA NETWORKS | \n2 | \nCOMPANY | \n2125445 | \nNOKIA CORP | \n2 | \nCOMPANY | \n
... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n
112235 | \n85719932 | \nVIKSTREM, Erik | \nВИКСТРЁМ, Эрик | \nNaN | \nSE | \nSE | \n0 | \n38919340 | \nVIKSTREM ERIK | \n185719932 | \nVIKSTREM, Erik | \n0 | \nUNKNOWN | \n185719932 | \nVIKSTREM, Erik | \n0 | \nUNKNOWN | \n
112236 | \n85720336 | \nHWANG, LING-CHI | \nHWANG, LING-CHI | \nNaN | \nTW | \nNaN | \n9 | \n35599384 | \nHWANG LING-CHI | \n185720336 | \nHWANG, LING-CHI | \n0 | \nUNKNOWN | \n185720336 | \nHWANG, LING-CHI | \n0 | \nUNKNOWN | \n
112237 | \n85720376 | \nLI, I Chan | \nLI, I Chan | \nNaN | \nTW | \nNaN | \n9 | \n38707281 | \nLI I CHAN | \n185720376 | \nLI, I Chan | \n0 | \nUNKNOWN | \n185720376 | \nLI, I Chan | \n0 | \nUNKNOWN | \n
112238 | \n85720469 | \nTING, Chia Ching | \nTING, Chia Ching | \nTW | \nTW | \nNaN | \n9 | \n23937900 | \nTING CHIA CHING | \n185720469 | \nTING, Chia Ching | \n0 | \nUNKNOWN | \n185720469 | \nTING, Chia Ching | \n0 | \nUNKNOWN | \n
112239 | \n85720500 | \nWANG, YU-CHEIH | \nWANG, YU-CHEIH | \nNaN | \nTW | \nNaN | \n9 | \n38204835 | \nWANG YU-CHEIH | \n185720500 | \nWANG, YU-CHEIH | \n0 | \nUNKNOWN | \n185720500 | \nWANG, YU-CHEIH | \n0 | \nUNKNOWN | \n
112240 rows × 17 columns
\n\n | han_id | \npsn_sector_primary | \n
---|---|---|
0 | \n264 | \nGOV NON-PROFIT UNIVERSITY | \n
1 | \n627 | \nCOMPANY | \n
2 | \n974 | \nCOMPANY | \n
3 | \n1480 | \nCOMPANY | \n
4 | \n1699 | \nCOMPANY | \n
... | \n... | \n... | \n
106154 | \n185719932 | \nUNKNOWN | \n
106155 | \n185720336 | \nUNKNOWN | \n
106156 | \n185720376 | \nUNKNOWN | \n
106157 | \n185720469 | \nUNKNOWN | \n
106158 | \n185720500 | \nUNKNOWN | \n
106159 rows × 2 columns
\n