{ "cells": [ { "cell_type": "code", "execution_count": 5, "metadata": { "collapsed": true }, "outputs": [], "source": [ "import os\n", "import pandas as pd\n", "import janitor\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "from matplotlib.ticker import MaxNLocator\n", "import math\n", "%matplotlib inline" ] }, { "cell_type": "code", "execution_count": 33, "outputs": [], "source": [ "outdir=\"EU_CH_scope/v2_\"\n", "\n", "appln = pd.read_csv(f\"{outdir}/tls_201_scope.csv\")\n", "\n", "appln_title = pd.read_csv(f\"{outdir}/tls_202_scope.csv\")\n", "\n", "pers = pd.read_csv(f\"{outdir}/tls_206_scope.csv\")\n", "pers['psn_sector'] = pers['psn_sector'].fillna(\"UNKNOWN\")\n", "\n", "appln_pers = pd.read_csv(f\"{outdir}/tls_207_scope.csv\")\n", "\n", "appln_cpc = pd.read_csv(f\"{outdir}/tls_224_scope.csv\")" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 23, "outputs": [ { "data": { "text/plain": " appln_id appln_auth appln_nr appln_kind appln_filing_date \n0 330225325 EP 11150195 A 2011-01-05 \\\n1 330322632 EP 11150485 A 2011-01-10 \n2 330350961 EP 11150683 A 2011-01-12 \n3 330374780 WO 2011050339 W 2011-01-12 \n4 330424360 WO 2011050199 W 2011-01-10 \n... ... ... ... ... ... \n64261 575551871 WO 2020142401 W 2020-12-31 \n64262 575551946 WO 2020142230 W 2020-12-31 \n64263 575553943 WO 2021142692 W 2021-12-29 \n64264 575553975 WO 2021142655 W 2021-12-29 \n64265 575556091 WO 2021064274 W 2021-12-20 \n\n appln_filing_year appln_nr_original ipr_type receiving_office \n0 2011 11150195 PI \\\n1 2011 11150485 PI \n2 2011 11150683 PI \n3 2011 EP2011/050339 PI EP \n4 2011 EP2011/050199 PI EP \n... ... ... ... ... \n64261 2020 CN2020/142401 PI CN \n64262 2020 CN2020/142230 PI CN \n64263 2021 CN2021/142692 PI CN \n64264 2021 CN2021/142655 PI CN \n64265 2021 US2021/064274 PI US \n\n internat_appln_id ... earliest_publn_date earliest_publn_year \n0 0 ... 2011-07-13 2011 \\\n1 0 ... 2012-07-11 2012 \n2 0 ... 2012-07-18 2012 \n3 0 ... 2011-07-21 2011 \n4 0 ... 2012-07-19 2012 \n... ... ... ... ... \n64261 0 ... 2022-07-07 2022 \n64262 0 ... 2022-07-07 2022 \n64263 0 ... 2022-07-07 2022 \n64264 0 ... 2022-07-07 2022 \n64265 0 ... 2022-07-07 2022 \n\n earliest_pat_publn_id granted docdb_family_id inpadoc_family_id \n0 335277427 Y 43754737 330225325 \\\n1 364719889 Y 43991052 330322632 \n2 364923578 N 43881056 330350961 \n3 335927718 N 43923624 330374780 \n4 365345607 N 43533009 330424360 \n... ... ... ... ... \n64261 575551872 N 82260109 575551871 \n64262 575551947 N 82260125 575551946 \n64263 575553944 N 79460210 564546189 \n64264 575553976 N 82260272 575553975 \n64265 575556092 N 82132815 575038927 \n\n docdb_family_size nb_citing_docdb_fam nb_applicants nb_inventors \n0 4 16 1 1 \n1 2 5 1 2 \n2 7 12 2 5 \n3 2 8 5 4 \n4 4 13 3 2 \n... ... ... ... ... \n64261 1 0 2 1 \n64262 1 0 3 3 \n64263 2 0 2 6 \n64264 1 0 2 7 \n64265 2 0 4 7 \n\n[64266 rows x 26 columns]", "text/html": "
\n | appln_id | \nappln_auth | \nappln_nr | \nappln_kind | \nappln_filing_date | \nappln_filing_year | \nappln_nr_original | \nipr_type | \nreceiving_office | \ninternat_appln_id | \n... | \nearliest_publn_date | \nearliest_publn_year | \nearliest_pat_publn_id | \ngranted | \ndocdb_family_id | \ninpadoc_family_id | \ndocdb_family_size | \nnb_citing_docdb_fam | \nnb_applicants | \nnb_inventors | \n
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n330225325 | \nEP | \n11150195 | \nA | \n2011-01-05 | \n2011 | \n11150195 | \nPI | \n\n | 0 | \n... | \n2011-07-13 | \n2011 | \n335277427 | \nY | \n43754737 | \n330225325 | \n4 | \n16 | \n1 | \n1 | \n
1 | \n330322632 | \nEP | \n11150485 | \nA | \n2011-01-10 | \n2011 | \n11150485 | \nPI | \n\n | 0 | \n... | \n2012-07-11 | \n2012 | \n364719889 | \nY | \n43991052 | \n330322632 | \n2 | \n5 | \n1 | \n2 | \n
2 | \n330350961 | \nEP | \n11150683 | \nA | \n2011-01-12 | \n2011 | \n11150683 | \nPI | \n\n | 0 | \n... | \n2012-07-18 | \n2012 | \n364923578 | \nN | \n43881056 | \n330350961 | \n7 | \n12 | \n2 | \n5 | \n
3 | \n330374780 | \nWO | \n2011050339 | \nW | \n2011-01-12 | \n2011 | \nEP2011/050339 | \nPI | \nEP | \n0 | \n... | \n2011-07-21 | \n2011 | \n335927718 | \nN | \n43923624 | \n330374780 | \n2 | \n8 | \n5 | \n4 | \n
4 | \n330424360 | \nWO | \n2011050199 | \nW | \n2011-01-10 | \n2011 | \nEP2011/050199 | \nPI | \nEP | \n0 | \n... | \n2012-07-19 | \n2012 | \n365345607 | \nN | \n43533009 | \n330424360 | \n4 | \n13 | \n3 | \n2 | \n
... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n
64261 | \n575551871 | \nWO | \n2020142401 | \nW | \n2020-12-31 | \n2020 | \nCN2020/142401 | \nPI | \nCN | \n0 | \n... | \n2022-07-07 | \n2022 | \n575551872 | \nN | \n82260109 | \n575551871 | \n1 | \n0 | \n2 | \n1 | \n
64262 | \n575551946 | \nWO | \n2020142230 | \nW | \n2020-12-31 | \n2020 | \nCN2020/142230 | \nPI | \nCN | \n0 | \n... | \n2022-07-07 | \n2022 | \n575551947 | \nN | \n82260125 | \n575551946 | \n1 | \n0 | \n3 | \n3 | \n
64263 | \n575553943 | \nWO | \n2021142692 | \nW | \n2021-12-29 | \n2021 | \nCN2021/142692 | \nPI | \nCN | \n0 | \n... | \n2022-07-07 | \n2022 | \n575553944 | \nN | \n79460210 | \n564546189 | \n2 | \n0 | \n2 | \n6 | \n
64264 | \n575553975 | \nWO | \n2021142655 | \nW | \n2021-12-29 | \n2021 | \nCN2021/142655 | \nPI | \nCN | \n0 | \n... | \n2022-07-07 | \n2022 | \n575553976 | \nN | \n82260272 | \n575553975 | \n1 | \n0 | \n2 | \n7 | \n
64265 | \n575556091 | \nWO | \n2021064274 | \nW | \n2021-12-20 | \n2021 | \nUS2021/064274 | \nPI | \nUS | \n0 | \n... | \n2022-07-07 | \n2022 | \n575556092 | \nN | \n82132815 | \n575038927 | \n2 | \n0 | \n4 | \n7 | \n
64266 rows × 26 columns
\n\n | appln_id | \nappln_title_lg | \nappln_title | \n
---|---|---|---|
0 | \n330225325 | \nen | \nBeverage preparation machine | \n
1 | \n330322632 | \nen | \nMethod and system for recommending contextual ... | \n
2 | \n330350961 | \nen | \nA method and an apparatus for treating at leas... | \n
3 | \n330374780 | \nen | \nA METHOD FOR DIAGNOSIS OF FAULT IN VEHICULAR W... | \n
4 | \n330424360 | \nen | \nERROR CONTROL IN A COMMUNICATION SYSTEM | \n
... | \n... | \n... | \n... | \n
64258 | \n575551871 | \nen | \nIMAGE STITCHING METHOD AND APPARATUS, AND COMP... | \n
64259 | \n575551946 | \nen | \nLOW VOC AND FOOD GRADE RESEALABLE LABEL | \n
64260 | \n575553943 | \nen | \nMETHOD, DEVICE, COMPUTER READABLE MEDIUM, AND ... | \n
64261 | \n575553975 | \nen | \nMULTISPECIFIC ANTIGEN BINDING PROTEINS | \n
64262 | \n575556091 | \nen | \nSYSTEM AND METHOD FOR METHANE HYDRATE BASED PR... | \n
64263 rows × 3 columns
\n\n | appln_id | \nappln_auth | \nappln_nr | \nappln_kind | \nappln_filing_date | \nappln_filing_year | \nappln_nr_original | \nipr_type | \nreceiving_office | \ninternat_appln_id | \n... | \nearliest_pat_publn_id | \ngranted | \ndocdb_family_id | \ninpadoc_family_id | \ndocdb_family_size | \nnb_citing_docdb_fam | \nnb_applicants | \nnb_inventors | \nappln_title_lg | \nappln_title | \n
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n330225325 | \nEP | \n11150195 | \nA | \n2011-01-05 | \n2011 | \n11150195 | \nPI | \n\n | 0 | \n... | \n335277427 | \nY | \n43754737 | \n330225325 | \n4 | \n16 | \n1 | \n1 | \nen | \nBeverage preparation machine | \n
1 | \n330322632 | \nEP | \n11150485 | \nA | \n2011-01-10 | \n2011 | \n11150485 | \nPI | \n\n | 0 | \n... | \n364719889 | \nY | \n43991052 | \n330322632 | \n2 | \n5 | \n1 | \n2 | \nen | \nMethod and system for recommending contextual ... | \n
2 | \n330350961 | \nEP | \n11150683 | \nA | \n2011-01-12 | \n2011 | \n11150683 | \nPI | \n\n | 0 | \n... | \n364923578 | \nN | \n43881056 | \n330350961 | \n7 | \n12 | \n2 | \n5 | \nen | \nA method and an apparatus for treating at leas... | \n
3 | \n330374780 | \nWO | \n2011050339 | \nW | \n2011-01-12 | \n2011 | \nEP2011/050339 | \nPI | \nEP | \n0 | \n... | \n335927718 | \nN | \n43923624 | \n330374780 | \n2 | \n8 | \n5 | \n4 | \nen | \nA METHOD FOR DIAGNOSIS OF FAULT IN VEHICULAR W... | \n
4 | \n330424360 | \nWO | \n2011050199 | \nW | \n2011-01-10 | \n2011 | \nEP2011/050199 | \nPI | \nEP | \n0 | \n... | \n365345607 | \nN | \n43533009 | \n330424360 | \n4 | \n13 | \n3 | \n2 | \nen | \nERROR CONTROL IN A COMMUNICATION SYSTEM | \n
5 rows × 28 columns
\n\n | person_id | \nappln_id | \napplt_seq_nr | \ninvt_seq_nr | \n
---|---|---|---|---|
0 | \n1 | \n340314532 | \n1 | \n0 | \n
1 | \n1 | \n413601768 | \n1 | \n0 | \n
2 | \n21 | \n332015605 | \n1 | \n0 | \n
3 | \n21 | \n333490084 | \n1 | \n0 | \n
4 | \n21 | \n335903805 | \n1 | \n0 | \n
... | \n... | \n... | \n... | \n... | \n
274039 | \n85719932 | \n545918634 | \n0 | \n2 | \n
274040 | \n85720336 | \n569409547 | \n0 | \n4 | \n
274041 | \n85720376 | \n555215896 | \n0 | \n2 | \n
274042 | \n85720469 | \n569304088 | \n0 | \n5 | \n
274043 | \n85720500 | \n569495993 | \n0 | \n5 | \n
274044 rows × 4 columns
\n\n | person_id | \nperson_name | \nperson_name_orig_lg | \nperson_address | \nperson_ctry_code | \nnuts | \nnuts_level | \ndoc_std_name_id | \ndoc_std_name | \npsn_id | \npsn_name | \npsn_level | \npsn_sector | \nhan_id | \nhan_name | \nhan_harmonized | \npsn_sector_primary | \n
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n1 | \nNokia Corporation | \nNokia Corporation | \nKeilalahdentie 4,02150 Espoo | \nFI | \nFI1B1 | \n3 | \n1 | \nNOKIA CORP | \n23782051 | \nNOKIA CORPORATION | \n2 | \nCOMPANY | \n2125445 | \nNOKIA CORP | \n2 | \nCOMPANY | \n
1 | \n128 | \nNokia Siemens Networks Oy | \nNokia Siemens Networks Oy | \nKaraportti 3,02610 Espoo | \nFI | \nFI1B1 | \n3 | \n112 | \nNOKIA SIEMENS NETWORKS OY | \n23782129 | \nNOKIA NETWORKS | \n2 | \nCOMPANY | \n2125445 | \nNOKIA CORP | \n2 | \nCOMPANY | \n
2 | \n5217785 | \nNokia Corporation | \nNokia Corporation | \nEspoo | \nFI | \nFI | \n0 | \n1 | \nNOKIA CORP | \n23782051 | \nNOKIA CORPORATION | \n2 | \nCOMPANY | \n2125445 | \nNOKIA CORP | \n2 | \nCOMPANY | \n
3 | \n5217811 | \nNokia Corporation | \nNokia Corporation | \nNaN | \nFI | \nFI | \n0 | \n1 | \nNOKIA CORP | \n23782051 | \nNOKIA CORPORATION | \n2 | \nCOMPANY | \n2125445 | \nNOKIA CORP | \n2 | \nCOMPANY | \n
4 | \n5232170 | \nNokia Siemens Networks Oy | \nNokia Siemens Networks Oy | \nEspoo | \nFI | \nFI | \n0 | \n112 | \nNOKIA SIEMENS NETWORKS OY | \n23782129 | \nNOKIA NETWORKS | \n2 | \nCOMPANY | \n2125445 | \nNOKIA CORP | \n2 | \nCOMPANY | \n
... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n
112235 | \n85719932 | \nVIKSTREM, Erik | \nВИКСТРЁМ, Эрик | \nNaN | \nSE | \nSE | \n0 | \n38919340 | \nVIKSTREM ERIK | \n185719932 | \nVIKSTREM, Erik | \n0 | \nUNKNOWN | \n185719932 | \nVIKSTREM, Erik | \n0 | \nUNKNOWN | \n
112236 | \n85720336 | \nHWANG, LING-CHI | \nHWANG, LING-CHI | \nNaN | \nTW | \nNaN | \n9 | \n35599384 | \nHWANG LING-CHI | \n185720336 | \nHWANG, LING-CHI | \n0 | \nUNKNOWN | \n185720336 | \nHWANG, LING-CHI | \n0 | \nUNKNOWN | \n
112237 | \n85720376 | \nLI, I Chan | \nLI, I Chan | \nNaN | \nTW | \nNaN | \n9 | \n38707281 | \nLI I CHAN | \n185720376 | \nLI, I Chan | \n0 | \nUNKNOWN | \n185720376 | \nLI, I Chan | \n0 | \nUNKNOWN | \n
112238 | \n85720469 | \nTING, Chia Ching | \nTING, Chia Ching | \nTW | \nTW | \nNaN | \n9 | \n23937900 | \nTING CHIA CHING | \n185720469 | \nTING, Chia Ching | \n0 | \nUNKNOWN | \n185720469 | \nTING, Chia Ching | \n0 | \nUNKNOWN | \n
112239 | \n85720500 | \nWANG, YU-CHEIH | \nWANG, YU-CHEIH | \nNaN | \nTW | \nNaN | \n9 | \n38204835 | \nWANG YU-CHEIH | \n185720500 | \nWANG, YU-CHEIH | \n0 | \nUNKNOWN | \n185720500 | \nWANG, YU-CHEIH | \n0 | \nUNKNOWN | \n
112240 rows × 17 columns
\n\n | han_id | \npsn_sector_primary | \n
---|---|---|
0 | \n264 | \nGOV NON-PROFIT UNIVERSITY | \n
1 | \n627 | \nCOMPANY | \n
2 | \n974 | \nCOMPANY | \n
3 | \n1480 | \nCOMPANY | \n
4 | \n1699 | \nCOMPANY | \n
... | \n... | \n... | \n
106154 | \n185719932 | \nUNKNOWN | \n
106155 | \n185720336 | \nUNKNOWN | \n
106156 | \n185720376 | \nUNKNOWN | \n
106157 | \n185720469 | \nUNKNOWN | \n
106158 | \n185720500 | \nUNKNOWN | \n
106159 rows × 2 columns
\n