{ "cells": [ { "cell_type": "code", "execution_count": 19, "metadata": { "collapsed": true }, "outputs": [], "source": [ "import os\n", "import pandas as pd\n", "import janitor\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "from matplotlib.ticker import MaxNLocator\n", "import math\n", "%matplotlib inline" ] }, { "cell_type": "code", "execution_count": 20, "outputs": [], "source": [ "outdir=\"WESTERN_CH_scope\"\n", "\n", "appln = pd.read_csv(f\"{outdir}/tls_201_scope.csv\")\n", "\n", "appln_title = pd.read_csv(f\"{outdir}/tls_202_scope.csv\")\n", "\n", "pers = pd.read_csv(f\"{outdir}/tls_206_scope.csv\")\n", "pers['psn_sector'] = pers['psn_sector'].fillna(\"UNKNOWN\")\n", "\n", "appln_pers = pd.read_csv(f\"{outdir}/tls_207_scope.csv\")\n", "\n", "appln_cpc = pd.read_csv(f\"{outdir}/tls_224_scope.csv\")" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 21, "outputs": [ { "data": { "text/plain": "203873" }, "execution_count": 21, "metadata": {}, "output_type": "execute_result" } ], "source": [ "len(appln)" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 22, "outputs": [ { "data": { "text/plain": " appln_id appln_title_lg \n6613 365740889 en \\\n15307 405955962 en \n34917 420680979 en \n65975 456943983 en \n31541 418199646 en \n... ... ... \n53388 444848074 en \n164003 549678226 en \n19193 409424261 en \n158766 545277468 en \n106813 498995405 en \n\n appln_title \n6613 CARD CONNECTOR \n15307 SERVO WRITE ASSEMBLY \n34917 CHILD SLEEPING APPARATUS WITH ADJUSTABLE SLEEP... \n65975 - NEAR-FIELD TRANSDUCER WITH RECESSED REGION \n31541 ELECTROSTATIC SPRAY TOOL SYSTEM \n... ... \n53388 Brassiere shoulder-strap closure \n164003 System and method for validating honest test t... \n19193 Hybrid wind turbine blade bearing \n158766 Video coding with successive codecs \n106813 IMAGE RECOGNITION METHOD AND APPARATUS \n\n[100 rows x 3 columns]", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
appln_idappln_title_lgappln_title
6613365740889enCARD CONNECTOR
15307405955962enSERVO WRITE ASSEMBLY
34917420680979enCHILD SLEEPING APPARATUS WITH ADJUSTABLE SLEEP...
65975456943983en- NEAR-FIELD TRANSDUCER WITH RECESSED REGION
31541418199646enELECTROSTATIC SPRAY TOOL SYSTEM
............
53388444848074enBrassiere shoulder-strap closure
164003549678226enSystem and method for validating honest test t...
19193409424261enHybrid wind turbine blade bearing
158766545277468enVideo coding with successive codecs
106813498995405enIMAGE RECOGNITION METHOD AND APPARATUS
\n

100 rows × 3 columns

\n
" }, "execution_count": 22, "metadata": {}, "output_type": "execute_result" } ], "source": [ "appln_title.sample(100)" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 23, "outputs": [ { "data": { "text/plain": " appln_id appln_auth appln_nr appln_kind appln_filing_date \n0 330225325 EP 11150195 A 2011-01-05 \\\n1 330225397 EP 11150231 A 2011-01-05 \n2 330322632 EP 11150485 A 2011-01-10 \n3 330326785 EP 11150605 A 2011-01-11 \n4 330350961 EP 11150683 A 2011-01-12 \n\n appln_filing_year appln_nr_original ipr_type receiving_office \n0 2011 11150195 PI \\\n1 2011 11150231 PI \n2 2011 11150485 PI \n3 2011 11150605 PI \n4 2011 11150683 PI \n\n internat_appln_id ... earliest_pat_publn_id granted docdb_family_id \n0 0 ... 335277427 Y 43754737 \\\n1 0 ... 335277736 Y 43619902 \n2 0 ... 364719889 Y 43991052 \n3 0 ... 335277720 N 43023665 \n4 0 ... 364923578 N 43881056 \n\n inpadoc_family_id docdb_family_size nb_citing_docdb_fam nb_applicants \n0 330225325 4 16 1 \\\n1 330225397 6 56 1 \n2 330322632 2 5 1 \n3 328518903 6 9 1 \n4 330350961 7 13 2 \n\n nb_inventors appln_title_lg \n0 1 en \\\n1 9 en \n2 2 en \n3 3 en \n4 5 en \n\n appln_title \n0 Beverage preparation machine \n1 Screwdriving tool having a driving tool with a... \n2 Method and system for recommending contextual ... \n3 Apparatus and method for continuous casting of... \n4 A method and an apparatus for treating at leas... \n\n[5 rows x 28 columns]", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
appln_idappln_authappln_nrappln_kindappln_filing_dateappln_filing_yearappln_nr_originalipr_typereceiving_officeinternat_appln_id...earliest_pat_publn_idgranteddocdb_family_idinpadoc_family_iddocdb_family_sizenb_citing_docdb_famnb_applicantsnb_inventorsappln_title_lgappln_title
0330225325EP11150195A2011-01-05201111150195PI0...335277427Y4375473733022532541611enBeverage preparation machine
1330225397EP11150231A2011-01-05201111150231PI0...335277736Y4361990233022539765619enScrewdriving tool having a driving tool with a...
2330322632EP11150485A2011-01-10201111150485PI0...364719889Y439910523303226322512enMethod and system for recommending contextual ...
3330326785EP11150605A2011-01-11201111150605PI0...335277720N430236653285189036913enApparatus and method for continuous casting of...
4330350961EP11150683A2011-01-12201111150683PI0...364923578N4388105633035096171325enA method and an apparatus for treating at leas...
\n

5 rows × 28 columns

\n
" }, "execution_count": 23, "metadata": {}, "output_type": "execute_result" } ], "source": [ "appln_data = appln.merge(appln_title, on=\"appln_id\")\n", "appln_data.head()" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 24, "outputs": [ { "data": { "text/plain": "array(['EP', 'WO', 'LU', 'FI', 'NO', 'FR', 'GB', 'KR', 'ES', 'US', 'CA',\n 'DO', 'EC', 'DE', 'UY', 'IL', 'SV', 'PL', 'TR', 'CO', 'CR', 'TW',\n 'MA', 'PE', 'SG', 'CU', 'BE', 'DK', 'AR', 'AP', 'HR', 'MX', 'BR',\n 'EA', 'RU', 'AU', 'MC', 'HU', 'PT', 'NL', 'HN', 'AT', 'RO', 'SM',\n 'CH', 'SI', 'IS', 'CZ', 'HK', 'MD', 'JP', 'CN', 'RS', 'GT', 'UA',\n 'CL', 'SK', 'LT', 'PH', 'MY', 'IN', 'VN', 'TN', 'CY', 'GE', 'ZA',\n 'SE', 'ME', 'JO', 'NI', 'SA'], dtype=object)" }, "execution_count": 24, "metadata": {}, "output_type": "execute_result" } ], "source": [ "appln_data[\"appln_auth\"].unique()" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 25, "outputs": [ { "data": { "text/plain": " person_id appln_id applt_seq_nr invt_seq_nr\n0 1 413601768 1 0\n1 21 332015605 1 0\n2 21 333490084 1 0\n3 21 335903805 1 0\n4 76 352908776 1 0\n... ... ... ... ...\n1025446 88836321 577982223 1 0\n1025447 88836333 583342135 0 4\n1025448 88836333 583342207 0 3\n1025449 88836333 585957705 0 5\n1025450 88836337 579601496 0 1\n\n[1025451 rows x 4 columns]", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
person_idappln_idapplt_seq_nrinvt_seq_nr
0141360176810
12133201560510
22133349008410
32133590380510
47635290877610
...............
10254468883632157798222310
10254478883633358334213504
10254488883633358334220703
10254498883633358595770505
10254508883633757960149601
\n

1025451 rows × 4 columns

\n
" }, "execution_count": 25, "metadata": {}, "output_type": "execute_result" } ], "source": [ "appln_pers" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 26, "outputs": [ { "data": { "text/plain": " person_id person_name person_name_orig_lg \n0 1 Nokia Corporation Nokia Corporation \\\n1 128 Nokia Siemens Networks Oy Nokia Siemens Networks Oy \n2 5217785 Nokia Corporation Nokia Corporation \n3 5217811 Nokia Corporation Nokia Corporation \n4 5232170 Nokia Siemens Networks Oy Nokia Siemens Networks Oy \n... ... ... ... \n354633 88836234 WONG, Chun Lok WONG, Chun Lok \n354634 88836257 XIAONING YE XIAONING YE \n354635 88836321 ZAI LAB (US) LLC ZAI LAB (US) LLC \n354636 88836333 ZHANG, Haocheng 张皓程 \n354637 88836337 ZHANG, Yangjun ZHANG, Yangjun \n\n person_address person_ctry_code nuts nuts_level \n0 Keilalahdentie 4,02150 Espoo FI FI1B1 3 \\\n1 Karaportti 3,02610 Espoo FI FI1B1 3 \n2 Espoo FI FI 0 \n3 NaN FI FI 0 \n4 Espoo FI FI 0 \n... ... ... ... ... \n354633 NaN US NaN 9 \n354634 Portland, Oregon US US NaN 9 \n354635 NaN US NaN 9 \n354636 NaN US NaN 9 \n354637 NaN US NaN 9 \n\n doc_std_name_id doc_std_name psn_id \n0 1 NOKIA CORP 23782051 \\\n1 112 NOKIA SIEMENS NETWORKS OY 23782129 \n2 1 NOKIA CORP 23782051 \n3 1 NOKIA CORP 23782051 \n4 112 NOKIA SIEMENS NETWORKS OY 23782129 \n... ... ... ... \n354633 30867225 WONG CHUN LOK 188836234 \n354634 8004293 XIAONING YE 188836257 \n354635 39363494 ZAI LAB US LLC 188836321 \n354636 7682590 ZHANG HAOCHENG 188836333 \n354637 2112344 ZHANG YANGJUN 188836337 \n\n psn_name psn_level psn_sector han_id han_name \n0 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \\\n1 NOKIA NETWORKS 2 COMPANY 2125445 NOKIA CORP \n2 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \n3 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \n4 NOKIA NETWORKS 2 COMPANY 2125445 NOKIA CORP \n... ... ... ... ... ... \n354633 WONG, Chun Lok 0 UNKNOWN 188836234 WONG, Chun Lok \n354634 XIAONING YE 0 UNKNOWN 188836257 XIAONING YE \n354635 ZAI LAB (US) LLC 0 UNKNOWN 188836321 ZAI LAB (US) LLC \n354636 ZHANG, Haocheng 0 UNKNOWN 188836333 ZHANG, Haocheng \n354637 ZHANG, Yangjun 0 UNKNOWN 188836337 ZHANG, Yangjun \n\n han_harmonized psn_sector_primary \n0 2 COMPANY \n1 2 COMPANY \n2 2 COMPANY \n3 2 COMPANY \n4 2 COMPANY \n... ... ... \n354633 0 UNKNOWN \n354634 0 UNKNOWN \n354635 0 UNKNOWN \n354636 0 UNKNOWN \n354637 0 UNKNOWN \n\n[354638 rows x 17 columns]", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
person_idperson_nameperson_name_orig_lgperson_addressperson_ctry_codenutsnuts_leveldoc_std_name_iddoc_std_namepsn_idpsn_namepsn_levelpsn_sectorhan_idhan_namehan_harmonizedpsn_sector_primary
01Nokia CorporationNokia CorporationKeilalahdentie 4,02150 EspooFIFI1B131NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
1128Nokia Siemens Networks OyNokia Siemens Networks OyKaraportti 3,02610 EspooFIFI1B13112NOKIA SIEMENS NETWORKS OY23782129NOKIA NETWORKS2COMPANY2125445NOKIA CORP2COMPANY
25217785Nokia CorporationNokia CorporationEspooFIFI01NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
35217811Nokia CorporationNokia CorporationNaNFIFI01NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
45232170Nokia Siemens Networks OyNokia Siemens Networks OyEspooFIFI0112NOKIA SIEMENS NETWORKS OY23782129NOKIA NETWORKS2COMPANY2125445NOKIA CORP2COMPANY
......................................................
35463388836234WONG, Chun LokWONG, Chun LokNaNUSNaN930867225WONG CHUN LOK188836234WONG, Chun Lok0UNKNOWN188836234WONG, Chun Lok0UNKNOWN
35463488836257XIAONING YEXIAONING YEPortland, Oregon USUSNaN98004293XIAONING YE188836257XIAONING YE0UNKNOWN188836257XIAONING YE0UNKNOWN
35463588836321ZAI LAB (US) LLCZAI LAB (US) LLCNaNUSNaN939363494ZAI LAB US LLC188836321ZAI LAB (US) LLC0UNKNOWN188836321ZAI LAB (US) LLC0UNKNOWN
35463688836333ZHANG, Haocheng张皓程NaNUSNaN97682590ZHANG HAOCHENG188836333ZHANG, Haocheng0UNKNOWN188836333ZHANG, Haocheng0UNKNOWN
35463788836337ZHANG, YangjunZHANG, YangjunNaNUSNaN92112344ZHANG YANGJUN188836337ZHANG, Yangjun0UNKNOWN188836337ZHANG, Yangjun0UNKNOWN
\n

354638 rows × 17 columns

\n
" }, "execution_count": 17, "metadata": {}, "output_type": "execute_result" }, { "data": { "text/plain": " person_id person_name person_name_orig_lg \n0 1 Nokia Corporation Nokia Corporation \\\n1 128 Nokia Siemens Networks Oy Nokia Siemens Networks Oy \n2 5217785 Nokia Corporation Nokia Corporation \n3 5217811 Nokia Corporation Nokia Corporation \n4 5232170 Nokia Siemens Networks Oy Nokia Siemens Networks Oy \n... ... ... ... \n354633 88836234 WONG, Chun Lok WONG, Chun Lok \n354634 88836257 XIAONING YE XIAONING YE \n354635 88836321 ZAI LAB (US) LLC ZAI LAB (US) LLC \n354636 88836333 ZHANG, Haocheng 张皓程 \n354637 88836337 ZHANG, Yangjun ZHANG, Yangjun \n\n person_address person_ctry_code nuts nuts_level \n0 Keilalahdentie 4,02150 Espoo FI FI1B1 3 \\\n1 Karaportti 3,02610 Espoo FI FI1B1 3 \n2 Espoo FI FI 0 \n3 NaN FI FI 0 \n4 Espoo FI FI 0 \n... ... ... ... ... \n354633 NaN US NaN 9 \n354634 Portland, Oregon US US NaN 9 \n354635 NaN US NaN 9 \n354636 NaN US NaN 9 \n354637 NaN US NaN 9 \n\n doc_std_name_id doc_std_name psn_id \n0 1 NOKIA CORP 23782051 \\\n1 112 NOKIA SIEMENS NETWORKS OY 23782129 \n2 1 NOKIA CORP 23782051 \n3 1 NOKIA CORP 23782051 \n4 112 NOKIA SIEMENS NETWORKS OY 23782129 \n... ... ... ... \n354633 30867225 WONG CHUN LOK 188836234 \n354634 8004293 XIAONING YE 188836257 \n354635 39363494 ZAI LAB US LLC 188836321 \n354636 7682590 ZHANG HAOCHENG 188836333 \n354637 2112344 ZHANG YANGJUN 188836337 \n\n psn_name psn_level psn_sector han_id han_name \n0 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \\\n1 NOKIA NETWORKS 2 COMPANY 2125445 NOKIA CORP \n2 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \n3 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \n4 NOKIA NETWORKS 2 COMPANY 2125445 NOKIA CORP \n... ... ... ... ... ... \n354633 WONG, Chun Lok 0 UNKNOWN 188836234 WONG, Chun Lok \n354634 XIAONING YE 0 UNKNOWN 188836257 XIAONING YE \n354635 ZAI LAB (US) LLC 0 UNKNOWN 188836321 ZAI LAB (US) LLC \n354636 ZHANG, Haocheng 0 UNKNOWN 188836333 ZHANG, Haocheng \n354637 ZHANG, Yangjun 0 UNKNOWN 188836337 ZHANG, Yangjun \n\n han_harmonized psn_sector_primary \n0 2 COMPANY \n1 2 COMPANY \n2 2 COMPANY \n3 2 COMPANY \n4 2 COMPANY \n... ... ... \n354633 0 UNKNOWN \n354634 0 UNKNOWN \n354635 0 UNKNOWN \n354636 0 UNKNOWN \n354637 0 UNKNOWN \n\n[354638 rows x 17 columns]", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
person_idperson_nameperson_name_orig_lgperson_addressperson_ctry_codenutsnuts_leveldoc_std_name_iddoc_std_namepsn_idpsn_namepsn_levelpsn_sectorhan_idhan_namehan_harmonizedpsn_sector_primary
01Nokia CorporationNokia CorporationKeilalahdentie 4,02150 EspooFIFI1B131NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
1128Nokia Siemens Networks OyNokia Siemens Networks OyKaraportti 3,02610 EspooFIFI1B13112NOKIA SIEMENS NETWORKS OY23782129NOKIA NETWORKS2COMPANY2125445NOKIA CORP2COMPANY
25217785Nokia CorporationNokia CorporationEspooFIFI01NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
35217811Nokia CorporationNokia CorporationNaNFIFI01NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
45232170Nokia Siemens Networks OyNokia Siemens Networks OyEspooFIFI0112NOKIA SIEMENS NETWORKS OY23782129NOKIA NETWORKS2COMPANY2125445NOKIA CORP2COMPANY
......................................................
35463388836234WONG, Chun LokWONG, Chun LokNaNUSNaN930867225WONG CHUN LOK188836234WONG, Chun Lok0UNKNOWN188836234WONG, Chun Lok0UNKNOWN
35463488836257XIAONING YEXIAONING YEPortland, Oregon USUSNaN98004293XIAONING YE188836257XIAONING YE0UNKNOWN188836257XIAONING YE0UNKNOWN
35463588836321ZAI LAB (US) LLCZAI LAB (US) LLCNaNUSNaN939363494ZAI LAB US LLC188836321ZAI LAB (US) LLC0UNKNOWN188836321ZAI LAB (US) LLC0UNKNOWN
35463688836333ZHANG, Haocheng张皓程NaNUSNaN97682590ZHANG HAOCHENG188836333ZHANG, Haocheng0UNKNOWN188836333ZHANG, Haocheng0UNKNOWN
35463788836337ZHANG, YangjunZHANG, YangjunNaNUSNaN92112344ZHANG YANGJUN188836337ZHANG, Yangjun0UNKNOWN188836337ZHANG, Yangjun0UNKNOWN
\n

354638 rows × 17 columns

\n
" }, "execution_count": 26, "metadata": {}, "output_type": "execute_result" } ], "source": [ "pers_sector_primary = pers.groupby(\"han_id\", as_index=False)[\"psn_sector\"].agg(\n", " lambda x: pd.Series.mode(x)[0]).rename(columns={\"psn_sector\":\"psn_sector_primary\"})\n", "persn = pers.merge(pers_sector_primary, on='han_id')\n", "persn" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 27, "outputs": [ { "data": { "text/plain": " han_id psn_sector_primary\n0 32 COMPANY\n1 54 COMPANY\n2 83 COMPANY\n3 200 COMPANY\n4 264 GOV NON-PROFIT UNIVERSITY\n... ... ...\n335519 188836234 UNKNOWN\n335520 188836257 UNKNOWN\n335521 188836321 UNKNOWN\n335522 188836333 UNKNOWN\n335523 188836337 UNKNOWN\n\n[335524 rows x 2 columns]", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
han_idpsn_sector_primary
032COMPANY
154COMPANY
283COMPANY
3200COMPANY
4264GOV NON-PROFIT UNIVERSITY
.........
335519188836234UNKNOWN
335520188836257UNKNOWN
335521188836321UNKNOWN
335522188836333UNKNOWN
335523188836337UNKNOWN
\n

335524 rows × 2 columns

\n
" }, "execution_count": 18, "metadata": {}, "output_type": "execute_result" }, { "data": { "text/plain": " han_id psn_sector_primary\n0 32 COMPANY\n1 54 COMPANY\n2 83 COMPANY\n3 200 COMPANY\n4 264 GOV NON-PROFIT UNIVERSITY\n... ... ...\n335519 188836234 UNKNOWN\n335520 188836257 UNKNOWN\n335521 188836321 UNKNOWN\n335522 188836333 UNKNOWN\n335523 188836337 UNKNOWN\n\n[335524 rows x 2 columns]", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
han_idpsn_sector_primary
032COMPANY
154COMPANY
283COMPANY
3200COMPANY
4264GOV NON-PROFIT UNIVERSITY
.........
335519188836234UNKNOWN
335520188836257UNKNOWN
335521188836321UNKNOWN
335522188836333UNKNOWN
335523188836337UNKNOWN
\n

335524 rows × 2 columns

\n
" }, "execution_count": 27, "metadata": {}, "output_type": "execute_result" } ], "source": [ "pers_sector_primary" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 27, "outputs": [], "source": [], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 28, "outputs": [], "source": [ "appln_merge = appln.merge(appln_title, on=\"appln_id\")#.merge(appln_pers,on=\"appln_id\")\n", "appln_merge.to_excel(\"appln_data.xlsx\", index=False)" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 29, "outputs": [], "source": [ "person_merge = appln_pers.merge(pers,on=\"person_id\")\n", "person_merge.to_excel(\"person_data.xlsx\", index=False)" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 30, "outputs": [ { "data": { "text/plain": "array(['FI', 'NL', 'FR', 'CH', 'US', 'DE', 'DK', 'AT', 'SE', 'BE', 'CN',\n 'IT', 'LU', 'IE', 'SI', 'HK', 'MO', 'CZ', 'ES', 'NO', 'PL', 'HU',\n 'CY', 'SK', 'PT', 'EE', 'MT', 'GR', 'RO', 'BG', 'LT', 'HR', 'LV'],\n dtype=object)" }, "execution_count": 30, "metadata": {}, "output_type": "execute_result" } ], "source": [ "pers[\"person_ctry_code\"].unique()" ], "metadata": { "collapsed": false } } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 2 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython2", "version": "2.7.6" } }, "nbformat": 4, "nbformat_minor": 0 }