From 444158b9f0b0f600ac98fddc8675296db9be0094 Mon Sep 17 00:00:00 2001 From: radvanyimome Date: Mon, 12 Jun 2023 09:19:08 +0200 Subject: [PATCH] ADD: PATSTAT CPC taxonomy and AI/ML/DB related groupsearch based on WOS keywords --- PATSTAT/patstat_analysis_pipeline.ipynb | 118 +++++++++++------------- PATSTAT/patstat_cpc_parse.ipynb | 78 +++++++++++----- 2 files changed, 111 insertions(+), 85 deletions(-) diff --git a/PATSTAT/patstat_analysis_pipeline.ipynb b/PATSTAT/patstat_analysis_pipeline.ipynb index b738328..b41bcf2 100644 --- a/PATSTAT/patstat_analysis_pipeline.ipynb +++ b/PATSTAT/patstat_analysis_pipeline.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": 1, + "execution_count": 19, "metadata": { "collapsed": true }, @@ -20,7 +20,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 20, "outputs": [], "source": [ "outdir=\"WESTERN_CH_scope\"\n", @@ -42,13 +42,13 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 21, "outputs": [ { "data": { "text/plain": "203873" }, - "execution_count": 5, + "execution_count": 21, "metadata": {}, "output_type": "execute_result" } @@ -62,14 +62,14 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 22, "outputs": [ { "data": { - "text/plain": " appln_id appln_title_lg \n106316 498640253 en \\\n119852 511974583 en \n193586 577006640 en \n172207 556318748 en \n117620 509549284 en \n... ... ... \n58791 448189845 en \n119362 511604550 en \n73722 471815906 en \n45133 438311946 en \n25978 414431520 en \n\n appln_title \n106316 DRAIN CLEANING DEVICE \n119852 Antenna panel switching and beam indication \n193586 Loft bed \n172207 Winch for Securing a Load \n117620 TEMPERATURE CONTROL APPARATUS FORELECTRIC VEHI... \n... ... \n58791 Collaborative spectrum sensing in cognitive ra... \n119362 CLIP-ON GLASSES WITH REPLACEABLE LENS \n73722 Sensitized, photo-sensitive glass and its prod... \n45133 PREPARATION OF 3,4-DIHYDRO-1,4-BENZOXAZEPIN-5(... \n25978 - CRYSTAL OSCILLATOR WITH LOW-POWER MODE \n\n[100 rows x 3 columns]", - "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
appln_idappln_title_lgappln_title
106316498640253enDRAIN CLEANING DEVICE
119852511974583enAntenna panel switching and beam indication
193586577006640enLoft bed
172207556318748enWinch for Securing a Load
117620509549284enTEMPERATURE CONTROL APPARATUS FORELECTRIC VEHI...
............
58791448189845enCollaborative spectrum sensing in cognitive ra...
119362511604550enCLIP-ON GLASSES WITH REPLACEABLE LENS
73722471815906enSensitized, photo-sensitive glass and its prod...
45133438311946enPREPARATION OF 3,4-DIHYDRO-1,4-BENZOXAZEPIN-5(...
25978414431520en- CRYSTAL OSCILLATOR WITH LOW-POWER MODE
\n

100 rows × 3 columns

\n
" + "text/plain": " appln_id appln_title_lg \n6613 365740889 en \\\n15307 405955962 en \n34917 420680979 en \n65975 456943983 en \n31541 418199646 en \n... ... ... \n53388 444848074 en \n164003 549678226 en \n19193 409424261 en \n158766 545277468 en \n106813 498995405 en \n\n appln_title \n6613 CARD CONNECTOR \n15307 SERVO WRITE ASSEMBLY \n34917 CHILD SLEEPING APPARATUS WITH ADJUSTABLE SLEEP... \n65975 - NEAR-FIELD TRANSDUCER WITH RECESSED REGION \n31541 ELECTROSTATIC SPRAY TOOL SYSTEM \n... ... \n53388 Brassiere shoulder-strap closure \n164003 System and method for validating honest test t... \n19193 Hybrid wind turbine blade bearing \n158766 Video coding with successive codecs \n106813 IMAGE RECOGNITION METHOD AND APPARATUS \n\n[100 rows x 3 columns]", + "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
appln_idappln_title_lgappln_title
6613365740889enCARD CONNECTOR
15307405955962enSERVO WRITE ASSEMBLY
34917420680979enCHILD SLEEPING APPARATUS WITH ADJUSTABLE SLEEP...
65975456943983en- NEAR-FIELD TRANSDUCER WITH RECESSED REGION
31541418199646enELECTROSTATIC SPRAY TOOL SYSTEM
............
53388444848074enBrassiere shoulder-strap closure
164003549678226enSystem and method for validating honest test t...
19193409424261enHybrid wind turbine blade bearing
158766545277468enVideo coding with successive codecs
106813498995405enIMAGE RECOGNITION METHOD AND APPARATUS
\n

100 rows × 3 columns

\n
" }, - "execution_count": 7, + "execution_count": 22, "metadata": {}, "output_type": "execute_result" } @@ -83,14 +83,14 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 23, "outputs": [ { "data": { "text/plain": " appln_id appln_auth appln_nr appln_kind appln_filing_date \n0 330225325 EP 11150195 A 2011-01-05 \\\n1 330225397 EP 11150231 A 2011-01-05 \n2 330322632 EP 11150485 A 2011-01-10 \n3 330326785 EP 11150605 A 2011-01-11 \n4 330350961 EP 11150683 A 2011-01-12 \n\n appln_filing_year appln_nr_original ipr_type receiving_office \n0 2011 11150195 PI \\\n1 2011 11150231 PI \n2 2011 11150485 PI \n3 2011 11150605 PI \n4 2011 11150683 PI \n\n internat_appln_id ... earliest_pat_publn_id granted docdb_family_id \n0 0 ... 335277427 Y 43754737 \\\n1 0 ... 335277736 Y 43619902 \n2 0 ... 364719889 Y 43991052 \n3 0 ... 335277720 N 43023665 \n4 0 ... 364923578 N 43881056 \n\n inpadoc_family_id docdb_family_size nb_citing_docdb_fam nb_applicants \n0 330225325 4 16 1 \\\n1 330225397 6 56 1 \n2 330322632 2 5 1 \n3 328518903 6 9 1 \n4 330350961 7 13 2 \n\n nb_inventors appln_title_lg \n0 1 en \\\n1 9 en \n2 2 en \n3 3 en \n4 5 en \n\n appln_title \n0 Beverage preparation machine \n1 Screwdriving tool having a driving tool with a... \n2 Method and system for recommending contextual ... \n3 Apparatus and method for continuous casting of... \n4 A method and an apparatus for treating at leas... \n\n[5 rows x 28 columns]", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
appln_idappln_authappln_nrappln_kindappln_filing_dateappln_filing_yearappln_nr_originalipr_typereceiving_officeinternat_appln_id...earliest_pat_publn_idgranteddocdb_family_idinpadoc_family_iddocdb_family_sizenb_citing_docdb_famnb_applicantsnb_inventorsappln_title_lgappln_title
0330225325EP11150195A2011-01-05201111150195PI0...335277427Y4375473733022532541611enBeverage preparation machine
1330225397EP11150231A2011-01-05201111150231PI0...335277736Y4361990233022539765619enScrewdriving tool having a driving tool with a...
2330322632EP11150485A2011-01-10201111150485PI0...364719889Y439910523303226322512enMethod and system for recommending contextual ...
3330326785EP11150605A2011-01-11201111150605PI0...335277720N430236653285189036913enApparatus and method for continuous casting of...
4330350961EP11150683A2011-01-12201111150683PI0...364923578N4388105633035096171325enA method and an apparatus for treating at leas...
\n

5 rows × 28 columns

\n
" }, - "execution_count": 8, + "execution_count": 23, "metadata": {}, "output_type": "execute_result" } @@ -105,13 +105,13 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 24, "outputs": [ { "data": { "text/plain": "array(['EP', 'WO', 'LU', 'FI', 'NO', 'FR', 'GB', 'KR', 'ES', 'US', 'CA',\n 'DO', 'EC', 'DE', 'UY', 'IL', 'SV', 'PL', 'TR', 'CO', 'CR', 'TW',\n 'MA', 'PE', 'SG', 'CU', 'BE', 'DK', 'AR', 'AP', 'HR', 'MX', 'BR',\n 'EA', 'RU', 'AU', 'MC', 'HU', 'PT', 'NL', 'HN', 'AT', 'RO', 'SM',\n 'CH', 'SI', 'IS', 'CZ', 'HK', 'MD', 'JP', 'CN', 'RS', 'GT', 'UA',\n 'CL', 'SK', 'LT', 'PH', 'MY', 'IN', 'VN', 'TN', 'CY', 'GE', 'ZA',\n 'SE', 'ME', 'JO', 'NI', 'SA'], dtype=object)" }, - "execution_count": 9, + "execution_count": 24, "metadata": {}, "output_type": "execute_result" } @@ -125,14 +125,14 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 25, "outputs": [ { "data": { - "text/plain": " person_id appln_id applt_seq_nr invt_seq_nr\n0 1 340314532 1 0\n1 1 413601768 1 0\n2 21 332015605 1 0\n3 21 333490084 1 0\n4 21 335903805 1 0\n... ... ... ... ...\n274039 85719932 545918634 0 2\n274040 85720336 569409547 0 4\n274041 85720376 555215896 0 2\n274042 85720469 569304088 0 5\n274043 85720500 569495993 0 5\n\n[274044 rows x 4 columns]", - "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
person_idappln_idapplt_seq_nrinvt_seq_nr
0134031453210
1141360176810
22133201560510
32133349008410
42133590380510
...............
2740398571993254591863402
2740408572033656940954704
2740418572037655521589602
2740428572046956930408805
2740438572050056949599305
\n

274044 rows × 4 columns

\n
" + "text/plain": " person_id appln_id applt_seq_nr invt_seq_nr\n0 1 413601768 1 0\n1 21 332015605 1 0\n2 21 333490084 1 0\n3 21 335903805 1 0\n4 76 352908776 1 0\n... ... ... ... ...\n1025446 88836321 577982223 1 0\n1025447 88836333 583342135 0 4\n1025448 88836333 583342207 0 3\n1025449 88836333 585957705 0 5\n1025450 88836337 579601496 0 1\n\n[1025451 rows x 4 columns]", + "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
person_idappln_idapplt_seq_nrinvt_seq_nr
0141360176810
12133201560510
22133349008410
32133590380510
47635290877610
...............
10254468883632157798222310
10254478883633358334213504
10254488883633358334220703
10254498883633358595770505
10254508883633757960149601
\n

1025451 rows × 4 columns

\n
" }, - "execution_count": 8, + "execution_count": 25, "metadata": {}, "output_type": "execute_result" } @@ -146,14 +146,23 @@ }, { "cell_type": "code", - "execution_count": 37, + "execution_count": 26, "outputs": [ { "data": { - "text/plain": " person_id person_name person_name_orig_lg \n0 1 Nokia Corporation Nokia Corporation \\\n1 128 Nokia Siemens Networks Oy Nokia Siemens Networks Oy \n2 5217785 Nokia Corporation Nokia Corporation \n3 5217811 Nokia Corporation Nokia Corporation \n4 5232170 Nokia Siemens Networks Oy Nokia Siemens Networks Oy \n... ... ... ... \n112235 85719932 VIKSTREM, Erik ВИКСТРЁМ, Эрик \n112236 85720336 HWANG, LING-CHI HWANG, LING-CHI \n112237 85720376 LI, I Chan LI, I Chan \n112238 85720469 TING, Chia Ching TING, Chia Ching \n112239 85720500 WANG, YU-CHEIH WANG, YU-CHEIH \n\n person_address person_ctry_code nuts nuts_level \n0 Keilalahdentie 4,02150 Espoo FI FI1B1 3 \\\n1 Karaportti 3,02610 Espoo FI FI1B1 3 \n2 Espoo FI FI 0 \n3 NaN FI FI 0 \n4 Espoo FI FI 0 \n... ... ... ... ... \n112235 NaN SE SE 0 \n112236 NaN TW NaN 9 \n112237 NaN TW NaN 9 \n112238 TW TW NaN 9 \n112239 NaN TW NaN 9 \n\n doc_std_name_id doc_std_name psn_id \n0 1 NOKIA CORP 23782051 \\\n1 112 NOKIA SIEMENS NETWORKS OY 23782129 \n2 1 NOKIA CORP 23782051 \n3 1 NOKIA CORP 23782051 \n4 112 NOKIA SIEMENS NETWORKS OY 23782129 \n... ... ... ... \n112235 38919340 VIKSTREM ERIK 185719932 \n112236 35599384 HWANG LING-CHI 185720336 \n112237 38707281 LI I CHAN 185720376 \n112238 23937900 TING CHIA CHING 185720469 \n112239 38204835 WANG YU-CHEIH 185720500 \n\n psn_name psn_level psn_sector han_id han_name \n0 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \\\n1 NOKIA NETWORKS 2 COMPANY 2125445 NOKIA CORP \n2 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \n3 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \n4 NOKIA NETWORKS 2 COMPANY 2125445 NOKIA CORP \n... ... ... ... ... ... \n112235 VIKSTREM, Erik 0 UNKNOWN 185719932 VIKSTREM, Erik \n112236 HWANG, LING-CHI 0 UNKNOWN 185720336 HWANG, LING-CHI \n112237 LI, I Chan 0 UNKNOWN 185720376 LI, I Chan \n112238 TING, Chia Ching 0 UNKNOWN 185720469 TING, Chia Ching \n112239 WANG, YU-CHEIH 0 UNKNOWN 185720500 WANG, YU-CHEIH \n\n han_harmonized psn_sector_primary \n0 2 COMPANY \n1 2 COMPANY \n2 2 COMPANY \n3 2 COMPANY \n4 2 COMPANY \n... ... ... \n112235 0 UNKNOWN \n112236 0 UNKNOWN \n112237 0 UNKNOWN \n112238 0 UNKNOWN \n112239 0 UNKNOWN \n\n[112240 rows x 17 columns]", - "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
person_idperson_nameperson_name_orig_lgperson_addressperson_ctry_codenutsnuts_leveldoc_std_name_iddoc_std_namepsn_idpsn_namepsn_levelpsn_sectorhan_idhan_namehan_harmonizedpsn_sector_primary
01Nokia CorporationNokia CorporationKeilalahdentie 4,02150 EspooFIFI1B131NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
1128Nokia Siemens Networks OyNokia Siemens Networks OyKaraportti 3,02610 EspooFIFI1B13112NOKIA SIEMENS NETWORKS OY23782129NOKIA NETWORKS2COMPANY2125445NOKIA CORP2COMPANY
25217785Nokia CorporationNokia CorporationEspooFIFI01NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
35217811Nokia CorporationNokia CorporationNaNFIFI01NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
45232170Nokia Siemens Networks OyNokia Siemens Networks OyEspooFIFI0112NOKIA SIEMENS NETWORKS OY23782129NOKIA NETWORKS2COMPANY2125445NOKIA CORP2COMPANY
......................................................
11223585719932VIKSTREM, ErikВИКСТРЁМ, ЭрикNaNSESE038919340VIKSTREM ERIK185719932VIKSTREM, Erik0UNKNOWN185719932VIKSTREM, Erik0UNKNOWN
11223685720336HWANG, LING-CHIHWANG, LING-CHINaNTWNaN935599384HWANG LING-CHI185720336HWANG, LING-CHI0UNKNOWN185720336HWANG, LING-CHI0UNKNOWN
11223785720376LI, I ChanLI, I ChanNaNTWNaN938707281LI I CHAN185720376LI, I Chan0UNKNOWN185720376LI, I Chan0UNKNOWN
11223885720469TING, Chia ChingTING, Chia ChingTWTWNaN923937900TING CHIA CHING185720469TING, Chia Ching0UNKNOWN185720469TING, Chia Ching0UNKNOWN
11223985720500WANG, YU-CHEIHWANG, YU-CHEIHNaNTWNaN938204835WANG YU-CHEIH185720500WANG, YU-CHEIH0UNKNOWN185720500WANG, YU-CHEIH0UNKNOWN
\n

112240 rows × 17 columns

\n
" + "text/plain": " person_id person_name person_name_orig_lg \n0 1 Nokia Corporation Nokia Corporation \\\n1 128 Nokia Siemens Networks Oy Nokia Siemens Networks Oy \n2 5217785 Nokia Corporation Nokia Corporation \n3 5217811 Nokia Corporation Nokia Corporation \n4 5232170 Nokia Siemens Networks Oy Nokia Siemens Networks Oy \n... ... ... ... \n354633 88836234 WONG, Chun Lok WONG, Chun Lok \n354634 88836257 XIAONING YE XIAONING YE \n354635 88836321 ZAI LAB (US) LLC ZAI LAB (US) LLC \n354636 88836333 ZHANG, Haocheng 张皓程 \n354637 88836337 ZHANG, Yangjun ZHANG, Yangjun \n\n person_address person_ctry_code nuts nuts_level \n0 Keilalahdentie 4,02150 Espoo FI FI1B1 3 \\\n1 Karaportti 3,02610 Espoo FI FI1B1 3 \n2 Espoo FI FI 0 \n3 NaN FI FI 0 \n4 Espoo FI FI 0 \n... ... ... ... ... \n354633 NaN US NaN 9 \n354634 Portland, Oregon US US NaN 9 \n354635 NaN US NaN 9 \n354636 NaN US NaN 9 \n354637 NaN US NaN 9 \n\n doc_std_name_id doc_std_name psn_id \n0 1 NOKIA CORP 23782051 \\\n1 112 NOKIA SIEMENS NETWORKS OY 23782129 \n2 1 NOKIA CORP 23782051 \n3 1 NOKIA CORP 23782051 \n4 112 NOKIA SIEMENS NETWORKS OY 23782129 \n... ... ... ... \n354633 30867225 WONG CHUN LOK 188836234 \n354634 8004293 XIAONING YE 188836257 \n354635 39363494 ZAI LAB US LLC 188836321 \n354636 7682590 ZHANG HAOCHENG 188836333 \n354637 2112344 ZHANG YANGJUN 188836337 \n\n psn_name psn_level psn_sector han_id han_name \n0 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \\\n1 NOKIA NETWORKS 2 COMPANY 2125445 NOKIA CORP \n2 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \n3 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \n4 NOKIA NETWORKS 2 COMPANY 2125445 NOKIA CORP \n... ... ... ... ... ... \n354633 WONG, Chun Lok 0 UNKNOWN 188836234 WONG, Chun Lok \n354634 XIAONING YE 0 UNKNOWN 188836257 XIAONING YE \n354635 ZAI LAB (US) LLC 0 UNKNOWN 188836321 ZAI LAB (US) LLC \n354636 ZHANG, Haocheng 0 UNKNOWN 188836333 ZHANG, Haocheng \n354637 ZHANG, Yangjun 0 UNKNOWN 188836337 ZHANG, Yangjun \n\n han_harmonized psn_sector_primary \n0 2 COMPANY \n1 2 COMPANY \n2 2 COMPANY \n3 2 COMPANY \n4 2 COMPANY \n... ... ... \n354633 0 UNKNOWN \n354634 0 UNKNOWN \n354635 0 UNKNOWN \n354636 0 UNKNOWN \n354637 0 UNKNOWN \n\n[354638 rows x 17 columns]", + "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
person_idperson_nameperson_name_orig_lgperson_addressperson_ctry_codenutsnuts_leveldoc_std_name_iddoc_std_namepsn_idpsn_namepsn_levelpsn_sectorhan_idhan_namehan_harmonizedpsn_sector_primary
01Nokia CorporationNokia CorporationKeilalahdentie 4,02150 EspooFIFI1B131NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
1128Nokia Siemens Networks OyNokia Siemens Networks OyKaraportti 3,02610 EspooFIFI1B13112NOKIA SIEMENS NETWORKS OY23782129NOKIA NETWORKS2COMPANY2125445NOKIA CORP2COMPANY
25217785Nokia CorporationNokia CorporationEspooFIFI01NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
35217811Nokia CorporationNokia CorporationNaNFIFI01NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
45232170Nokia Siemens Networks OyNokia Siemens Networks OyEspooFIFI0112NOKIA SIEMENS NETWORKS OY23782129NOKIA NETWORKS2COMPANY2125445NOKIA CORP2COMPANY
......................................................
35463388836234WONG, Chun LokWONG, Chun LokNaNUSNaN930867225WONG CHUN LOK188836234WONG, Chun Lok0UNKNOWN188836234WONG, Chun Lok0UNKNOWN
35463488836257XIAONING YEXIAONING YEPortland, Oregon USUSNaN98004293XIAONING YE188836257XIAONING YE0UNKNOWN188836257XIAONING YE0UNKNOWN
35463588836321ZAI LAB (US) LLCZAI LAB (US) LLCNaNUSNaN939363494ZAI LAB US LLC188836321ZAI LAB (US) LLC0UNKNOWN188836321ZAI LAB (US) LLC0UNKNOWN
35463688836333ZHANG, Haocheng张皓程NaNUSNaN97682590ZHANG HAOCHENG188836333ZHANG, Haocheng0UNKNOWN188836333ZHANG, Haocheng0UNKNOWN
35463788836337ZHANG, YangjunZHANG, YangjunNaNUSNaN92112344ZHANG YANGJUN188836337ZHANG, Yangjun0UNKNOWN188836337ZHANG, Yangjun0UNKNOWN
\n

354638 rows × 17 columns

\n
" }, - "execution_count": 37, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "text/plain": " person_id person_name person_name_orig_lg \n0 1 Nokia Corporation Nokia Corporation \\\n1 128 Nokia Siemens Networks Oy Nokia Siemens Networks Oy \n2 5217785 Nokia Corporation Nokia Corporation \n3 5217811 Nokia Corporation Nokia Corporation \n4 5232170 Nokia Siemens Networks Oy Nokia Siemens Networks Oy \n... ... ... ... \n354633 88836234 WONG, Chun Lok WONG, Chun Lok \n354634 88836257 XIAONING YE XIAONING YE \n354635 88836321 ZAI LAB (US) LLC ZAI LAB (US) LLC \n354636 88836333 ZHANG, Haocheng 张皓程 \n354637 88836337 ZHANG, Yangjun ZHANG, Yangjun \n\n person_address person_ctry_code nuts nuts_level \n0 Keilalahdentie 4,02150 Espoo FI FI1B1 3 \\\n1 Karaportti 3,02610 Espoo FI FI1B1 3 \n2 Espoo FI FI 0 \n3 NaN FI FI 0 \n4 Espoo FI FI 0 \n... ... ... ... ... \n354633 NaN US NaN 9 \n354634 Portland, Oregon US US NaN 9 \n354635 NaN US NaN 9 \n354636 NaN US NaN 9 \n354637 NaN US NaN 9 \n\n doc_std_name_id doc_std_name psn_id \n0 1 NOKIA CORP 23782051 \\\n1 112 NOKIA SIEMENS NETWORKS OY 23782129 \n2 1 NOKIA CORP 23782051 \n3 1 NOKIA CORP 23782051 \n4 112 NOKIA SIEMENS NETWORKS OY 23782129 \n... ... ... ... \n354633 30867225 WONG CHUN LOK 188836234 \n354634 8004293 XIAONING YE 188836257 \n354635 39363494 ZAI LAB US LLC 188836321 \n354636 7682590 ZHANG HAOCHENG 188836333 \n354637 2112344 ZHANG YANGJUN 188836337 \n\n psn_name psn_level psn_sector han_id han_name \n0 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \\\n1 NOKIA NETWORKS 2 COMPANY 2125445 NOKIA CORP \n2 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \n3 NOKIA CORPORATION 2 COMPANY 2125445 NOKIA CORP \n4 NOKIA NETWORKS 2 COMPANY 2125445 NOKIA CORP \n... ... ... ... ... ... \n354633 WONG, Chun Lok 0 UNKNOWN 188836234 WONG, Chun Lok \n354634 XIAONING YE 0 UNKNOWN 188836257 XIAONING YE \n354635 ZAI LAB (US) LLC 0 UNKNOWN 188836321 ZAI LAB (US) LLC \n354636 ZHANG, Haocheng 0 UNKNOWN 188836333 ZHANG, Haocheng \n354637 ZHANG, Yangjun 0 UNKNOWN 188836337 ZHANG, Yangjun \n\n han_harmonized psn_sector_primary \n0 2 COMPANY \n1 2 COMPANY \n2 2 COMPANY \n3 2 COMPANY \n4 2 COMPANY \n... ... ... \n354633 0 UNKNOWN \n354634 0 UNKNOWN \n354635 0 UNKNOWN \n354636 0 UNKNOWN \n354637 0 UNKNOWN \n\n[354638 rows x 17 columns]", + "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
person_idperson_nameperson_name_orig_lgperson_addressperson_ctry_codenutsnuts_leveldoc_std_name_iddoc_std_namepsn_idpsn_namepsn_levelpsn_sectorhan_idhan_namehan_harmonizedpsn_sector_primary
01Nokia CorporationNokia CorporationKeilalahdentie 4,02150 EspooFIFI1B131NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
1128Nokia Siemens Networks OyNokia Siemens Networks OyKaraportti 3,02610 EspooFIFI1B13112NOKIA SIEMENS NETWORKS OY23782129NOKIA NETWORKS2COMPANY2125445NOKIA CORP2COMPANY
25217785Nokia CorporationNokia CorporationEspooFIFI01NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
35217811Nokia CorporationNokia CorporationNaNFIFI01NOKIA CORP23782051NOKIA CORPORATION2COMPANY2125445NOKIA CORP2COMPANY
45232170Nokia Siemens Networks OyNokia Siemens Networks OyEspooFIFI0112NOKIA SIEMENS NETWORKS OY23782129NOKIA NETWORKS2COMPANY2125445NOKIA CORP2COMPANY
......................................................
35463388836234WONG, Chun LokWONG, Chun LokNaNUSNaN930867225WONG CHUN LOK188836234WONG, Chun Lok0UNKNOWN188836234WONG, Chun Lok0UNKNOWN
35463488836257XIAONING YEXIAONING YEPortland, Oregon USUSNaN98004293XIAONING YE188836257XIAONING YE0UNKNOWN188836257XIAONING YE0UNKNOWN
35463588836321ZAI LAB (US) LLCZAI LAB (US) LLCNaNUSNaN939363494ZAI LAB US LLC188836321ZAI LAB (US) LLC0UNKNOWN188836321ZAI LAB (US) LLC0UNKNOWN
35463688836333ZHANG, Haocheng张皓程NaNUSNaN97682590ZHANG HAOCHENG188836333ZHANG, Haocheng0UNKNOWN188836333ZHANG, Haocheng0UNKNOWN
35463788836337ZHANG, YangjunZHANG, YangjunNaNUSNaN92112344ZHANG YANGJUN188836337ZHANG, Yangjun0UNKNOWN188836337ZHANG, Yangjun0UNKNOWN
\n

354638 rows × 17 columns

\n
" + }, + "execution_count": 26, "metadata": {}, "output_type": "execute_result" } @@ -170,14 +179,23 @@ }, { "cell_type": "code", - "execution_count": 38, + "execution_count": 27, "outputs": [ { "data": { - "text/plain": " han_id psn_sector_primary\n0 264 GOV NON-PROFIT UNIVERSITY\n1 627 COMPANY\n2 974 COMPANY\n3 1480 COMPANY\n4 1699 COMPANY\n... ... ...\n106154 185719932 UNKNOWN\n106155 185720336 UNKNOWN\n106156 185720376 UNKNOWN\n106157 185720469 UNKNOWN\n106158 185720500 UNKNOWN\n\n[106159 rows x 2 columns]", - "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
han_idpsn_sector_primary
0264GOV NON-PROFIT UNIVERSITY
1627COMPANY
2974COMPANY
31480COMPANY
41699COMPANY
.........
106154185719932UNKNOWN
106155185720336UNKNOWN
106156185720376UNKNOWN
106157185720469UNKNOWN
106158185720500UNKNOWN
\n

106159 rows × 2 columns

\n
" + "text/plain": " han_id psn_sector_primary\n0 32 COMPANY\n1 54 COMPANY\n2 83 COMPANY\n3 200 COMPANY\n4 264 GOV NON-PROFIT UNIVERSITY\n... ... ...\n335519 188836234 UNKNOWN\n335520 188836257 UNKNOWN\n335521 188836321 UNKNOWN\n335522 188836333 UNKNOWN\n335523 188836337 UNKNOWN\n\n[335524 rows x 2 columns]", + "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
han_idpsn_sector_primary
032COMPANY
154COMPANY
283COMPANY
3200COMPANY
4264GOV NON-PROFIT UNIVERSITY
.........
335519188836234UNKNOWN
335520188836257UNKNOWN
335521188836321UNKNOWN
335522188836333UNKNOWN
335523188836337UNKNOWN
\n

335524 rows × 2 columns

\n
" + }, + "execution_count": 18, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "text/plain": " han_id psn_sector_primary\n0 32 COMPANY\n1 54 COMPANY\n2 83 COMPANY\n3 200 COMPANY\n4 264 GOV NON-PROFIT UNIVERSITY\n... ... ...\n335519 188836234 UNKNOWN\n335520 188836257 UNKNOWN\n335521 188836321 UNKNOWN\n335522 188836333 UNKNOWN\n335523 188836337 UNKNOWN\n\n[335524 rows x 2 columns]", + "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
han_idpsn_sector_primary
032COMPANY
154COMPANY
283COMPANY
3200COMPANY
4264GOV NON-PROFIT UNIVERSITY
.........
335519188836234UNKNOWN
335520188836257UNKNOWN
335521188836321UNKNOWN
335522188836333UNKNOWN
335523188836337UNKNOWN
\n

335524 rows × 2 columns

\n
" }, - "execution_count": 38, + "execution_count": 27, "metadata": {}, "output_type": "execute_result" } @@ -191,7 +209,16 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": 27, + "outputs": [], + "source": [], + "metadata": { + "collapsed": false + } + }, + { + "cell_type": "code", + "execution_count": 28, "outputs": [], "source": [ "appln_merge = appln.merge(appln_title, on=\"appln_id\")#.merge(appln_pers,on=\"appln_id\")\n", @@ -203,7 +230,7 @@ }, { "cell_type": "code", - "execution_count": 21, + "execution_count": 29, "outputs": [], "source": [ "person_merge = appln_pers.merge(pers,on=\"person_id\")\n", @@ -215,13 +242,13 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": 30, "outputs": [ { "data": { - "text/plain": "array(['FI', 'NL', 'FR', 'DE', 'DK', 'AT', 'SE', 'BE', 'TW', 'LU', 'CN',\n 'IT', 'HU', 'IE', 'SI', 'CZ', 'ES', 'HK', 'PL', 'CY', 'SK', 'PT',\n 'LT', 'EE', 'MT', 'GR', 'RO', 'BG', 'HR', 'MO', 'LV'], dtype=object)" + "text/plain": "array(['FI', 'NL', 'FR', 'CH', 'US', 'DE', 'DK', 'AT', 'SE', 'BE', 'CN',\n 'IT', 'LU', 'IE', 'SI', 'HK', 'MO', 'CZ', 'ES', 'NO', 'PL', 'HU',\n 'CY', 'SK', 'PT', 'EE', 'MT', 'GR', 'RO', 'BG', 'LT', 'HR', 'LV'],\n dtype=object)" }, - "execution_count": 18, + "execution_count": 30, "metadata": {}, "output_type": "execute_result" } @@ -232,39 +259,6 @@ "metadata": { "collapsed": false } - }, - { - "cell_type": "code", - "execution_count": 16, - "outputs": [ - { - "ename": "KeyError", - "evalue": "'cry_code'", - "output_type": "error", - "traceback": [ - "\u001B[1;31m---------------------------------------------------------------------------\u001B[0m", - "\u001B[1;31mKeyError\u001B[0m Traceback (most recent call last)", - "File \u001B[1;32m~\\.conda\\envs\\MOME_BIGDATA\\lib\\site-packages\\pandas\\core\\indexes\\base.py:3649\u001B[0m, in \u001B[0;36mIndex.get_loc\u001B[1;34m(self, key)\u001B[0m\n\u001B[0;32m 3648\u001B[0m \u001B[38;5;28;01mtry\u001B[39;00m:\n\u001B[1;32m-> 3649\u001B[0m \u001B[38;5;28;01mreturn\u001B[39;00m \u001B[38;5;28;43mself\u001B[39;49m\u001B[38;5;241;43m.\u001B[39;49m\u001B[43m_engine\u001B[49m\u001B[38;5;241;43m.\u001B[39;49m\u001B[43mget_loc\u001B[49m\u001B[43m(\u001B[49m\u001B[43mcasted_key\u001B[49m\u001B[43m)\u001B[49m\n\u001B[0;32m 3650\u001B[0m \u001B[38;5;28;01mexcept\u001B[39;00m \u001B[38;5;167;01mKeyError\u001B[39;00m \u001B[38;5;28;01mas\u001B[39;00m err:\n", - "File \u001B[1;32m~\\.conda\\envs\\MOME_BIGDATA\\lib\\site-packages\\pandas\\_libs\\index.pyx:147\u001B[0m, in \u001B[0;36mpandas._libs.index.IndexEngine.get_loc\u001B[1;34m()\u001B[0m\n", - "File \u001B[1;32m~\\.conda\\envs\\MOME_BIGDATA\\lib\\site-packages\\pandas\\_libs\\index.pyx:176\u001B[0m, in \u001B[0;36mpandas._libs.index.IndexEngine.get_loc\u001B[1;34m()\u001B[0m\n", - "File \u001B[1;32mpandas\\_libs\\hashtable_class_helper.pxi:7080\u001B[0m, in \u001B[0;36mpandas._libs.hashtable.PyObjectHashTable.get_item\u001B[1;34m()\u001B[0m\n", - "File \u001B[1;32mpandas\\_libs\\hashtable_class_helper.pxi:7088\u001B[0m, in \u001B[0;36mpandas._libs.hashtable.PyObjectHashTable.get_item\u001B[1;34m()\u001B[0m\n", - "\u001B[1;31mKeyError\u001B[0m: 'cry_code'", - "\nThe above exception was the direct cause of the following exception:\n", - "\u001B[1;31mKeyError\u001B[0m Traceback (most recent call last)", - "Cell \u001B[1;32mIn[16], line 1\u001B[0m\n\u001B[1;32m----> 1\u001B[0m \u001B[43mperson_merge\u001B[49m\u001B[43m[\u001B[49m\u001B[38;5;124;43m\"\u001B[39;49m\u001B[38;5;124;43mcry_code\u001B[39;49m\u001B[38;5;124;43m\"\u001B[39;49m\u001B[43m]\u001B[49m\u001B[38;5;241m.\u001B[39munique()\n", - "File \u001B[1;32m~\\.conda\\envs\\MOME_BIGDATA\\lib\\site-packages\\pandas\\core\\frame.py:3745\u001B[0m, in \u001B[0;36mDataFrame.__getitem__\u001B[1;34m(self, key)\u001B[0m\n\u001B[0;32m 3743\u001B[0m \u001B[38;5;28;01mif\u001B[39;00m \u001B[38;5;28mself\u001B[39m\u001B[38;5;241m.\u001B[39mcolumns\u001B[38;5;241m.\u001B[39mnlevels \u001B[38;5;241m>\u001B[39m \u001B[38;5;241m1\u001B[39m:\n\u001B[0;32m 3744\u001B[0m \u001B[38;5;28;01mreturn\u001B[39;00m \u001B[38;5;28mself\u001B[39m\u001B[38;5;241m.\u001B[39m_getitem_multilevel(key)\n\u001B[1;32m-> 3745\u001B[0m indexer \u001B[38;5;241m=\u001B[39m \u001B[38;5;28;43mself\u001B[39;49m\u001B[38;5;241;43m.\u001B[39;49m\u001B[43mcolumns\u001B[49m\u001B[38;5;241;43m.\u001B[39;49m\u001B[43mget_loc\u001B[49m\u001B[43m(\u001B[49m\u001B[43mkey\u001B[49m\u001B[43m)\u001B[49m\n\u001B[0;32m 3746\u001B[0m \u001B[38;5;28;01mif\u001B[39;00m is_integer(indexer):\n\u001B[0;32m 3747\u001B[0m indexer \u001B[38;5;241m=\u001B[39m [indexer]\n", - "File \u001B[1;32m~\\.conda\\envs\\MOME_BIGDATA\\lib\\site-packages\\pandas\\core\\indexes\\base.py:3651\u001B[0m, in \u001B[0;36mIndex.get_loc\u001B[1;34m(self, key)\u001B[0m\n\u001B[0;32m 3649\u001B[0m \u001B[38;5;28;01mreturn\u001B[39;00m \u001B[38;5;28mself\u001B[39m\u001B[38;5;241m.\u001B[39m_engine\u001B[38;5;241m.\u001B[39mget_loc(casted_key)\n\u001B[0;32m 3650\u001B[0m \u001B[38;5;28;01mexcept\u001B[39;00m \u001B[38;5;167;01mKeyError\u001B[39;00m \u001B[38;5;28;01mas\u001B[39;00m err:\n\u001B[1;32m-> 3651\u001B[0m \u001B[38;5;28;01mraise\u001B[39;00m \u001B[38;5;167;01mKeyError\u001B[39;00m(key) \u001B[38;5;28;01mfrom\u001B[39;00m \u001B[38;5;21;01merr\u001B[39;00m\n\u001B[0;32m 3652\u001B[0m \u001B[38;5;28;01mexcept\u001B[39;00m \u001B[38;5;167;01mTypeError\u001B[39;00m:\n\u001B[0;32m 3653\u001B[0m \u001B[38;5;66;03m# If we have a listlike key, _check_indexing_error will raise\u001B[39;00m\n\u001B[0;32m 3654\u001B[0m \u001B[38;5;66;03m# InvalidIndexError. Otherwise we fall through and re-raise\u001B[39;00m\n\u001B[0;32m 3655\u001B[0m \u001B[38;5;66;03m# the TypeError.\u001B[39;00m\n\u001B[0;32m 3656\u001B[0m \u001B[38;5;28mself\u001B[39m\u001B[38;5;241m.\u001B[39m_check_indexing_error(key)\n", - "\u001B[1;31mKeyError\u001B[0m: 'cry_code'" - ] - } - ], - "source": [ - "person_merge[\"cry_code\"].unique()" - ], - "metadata": { - "collapsed": false - } } ], "metadata": { diff --git a/PATSTAT/patstat_cpc_parse.ipynb b/PATSTAT/patstat_cpc_parse.ipynb index 057f87c..e6a0cce 100644 --- a/PATSTAT/patstat_cpc_parse.ipynb +++ b/PATSTAT/patstat_cpc_parse.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": 1, + "execution_count": 60, "id": "a8be6839", "metadata": {}, "outputs": [], @@ -19,7 +19,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 61, "id": "211ba466", "metadata": {}, "outputs": [], @@ -39,7 +39,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 62, "id": "f878b151", "metadata": {}, "outputs": [], @@ -59,7 +59,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 63, "id": "95ea20da", "metadata": {}, "outputs": [], @@ -103,7 +103,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 63, "id": "907d9c3e", "metadata": {}, "outputs": [], @@ -111,7 +111,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 64, "id": "1be8971a", "metadata": {}, "outputs": [ @@ -134,7 +134,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 65, "id": "b1274c34", "metadata": {}, "outputs": [], @@ -145,7 +145,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 66, "id": "2a7e39ee", "metadata": {}, "outputs": [], @@ -164,7 +164,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 67, "id": "e31a013f", "metadata": {}, "outputs": [ @@ -172,7 +172,7 @@ "data": { "text/plain": "[('A', 'HUMAN NECESSITIES'),\n ('A01',\n 'AGRICULTURE; FORESTRY; ANIMAL HUSBANDRY; HUNTING; TRAPPING; FISHING'),\n ('A01B',\n 'SOIL WORKING IN AGRICULTURE OR FORESTRY; PARTS, DETAILS, OR ACCESSORIES OF AGRICULTURAL MACHINES OR IMPLEMENTS, IN GENERAL (making or covering furrows or holes for sowing, planting, or manuring A01C5/00; soil working for engineering purposes E01, E02, E21; {measuring areas for agricultural purposes G01B})'),\n ('A01B1/06',\n 'Hoes; Hand cultivators {(rakes A01D7/00; forks A01D9/00; picks B25D)}'),\n ('A01B1/065', '{powered}')]" }, - "execution_count": 10, + "execution_count": 67, "metadata": {}, "output_type": "execute_result" } @@ -183,7 +183,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 68, "id": "f09a616c", "metadata": {}, "outputs": [ @@ -192,7 +192,7 @@ "text/plain": " cpc_id cpc_name section class \n0 A HUMAN NECESSITIES A None \\\n1 A01 AGRICULTURE; FORESTRY; ANIMAL HUSBANDRY; HUNTI... A 01 \n2 A01B SOIL WORKING IN AGRICULTURE OR FORESTRY; PARTS... A 01 \n3 A01B1/00 Hand tools (edge trimmers for lawns A01G3/06 ... A 01 \n4 A01B1/02 Spades; Shovels {(hand-operated dredgers E02F3... A 01 \n\n subclass group main_group cpc_version \n0 None None None 2023 \\\n1 None None None 2023 \n2 B None None 2023 \n3 B 1 00 2023 \n4 B 1 02 2023 \n\n version https://git-lfs.github.com/spec/v1 \n0 NaN \\\n1 NaN \n2 NaN \n3 NaN \n4 NaN \n\n cpc_taxonomy \n0 [(A, HUMAN NECESSITIES)] \n1 [(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO... \n2 [(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO... \n3 [(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO... \n4 [(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO... ", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
cpc_idcpc_namesectionclasssubclassgroupmain_groupcpc_versionversion https://git-lfs.github.com/spec/v1cpc_taxonomy
0AHUMAN NECESSITIESANoneNoneNoneNone2023NaN[(A, HUMAN NECESSITIES)]
1A01AGRICULTURE; FORESTRY; ANIMAL HUSBANDRY; HUNTI...A01NoneNoneNone2023NaN[(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO...
2A01BSOIL WORKING IN AGRICULTURE OR FORESTRY; PARTS...A01BNoneNone2023NaN[(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO...
3A01B1/00Hand tools (edge trimmers for lawns A01G3/06 ...A01B1002023NaN[(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO...
4A01B1/02Spades; Shovels {(hand-operated dredgers E02F3...A01B1022023NaN[(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO...
\n
" }, - "execution_count": 12, + "execution_count": 68, "metadata": {}, "output_type": "execute_result" } @@ -204,7 +204,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 69, "id": "f3fa8bf3", "metadata": {}, "outputs": [ @@ -226,7 +226,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 70, "id": "58701721", "metadata": {}, "outputs": [], @@ -244,13 +244,13 @@ }, { "cell_type": "code", - "execution_count": 49, + "execution_count": 71, "outputs": [ { "data": { "text/plain": "'neural network|machine learn|deep learn|remote sensing|convolutional neural|internet of things|feature extraction|genetic algorithm|big data|artificial intelligence|data driven|support vector machine|logistic regression not p=|optimization algorithm|principal component analysis|artificial neural network|swarm optimization|regularization|linear regression not p=|optimization algorithm|random forest|cloud computing|reinforcement learning|computer vision|kalman filter|image processing|data mining|evolutionary algorithm|edge computing|supervised learning|computational modeling|pattern recognition|image classification|long short-term memor|robotics|image segmentation|convex optimization|covariance matri|attention mechanism|markov chain|object detection not brain|clustering algorithm|recurrent neural network|data augmentation|transfer learning|adversarial network|decision tree|multi agent system|fuzzy set|convolutional network|image reconstruction|data analytic|smart grid|autoencoder|fuzzy logic|radial basis function|bayesian network|dimensionality reduction|face recognition not brain|gaussian process|anomaly detection|k-nearest neighbor|natural language processing|monte carlo method|large dataset|gradient descent|support vector regression|extreme learning machine|perceptron|model selection|ensemble learning|representation learning|recommender system|target tracking|singular value decomposition|feature learning|smart city|sentiment analy|markov decision process|k-means clustering|independent component analysis|brain computer interface|human-computer interaction|markov chain monte carlo|hierarchical clustering|semantic web|semi-supervised learning|human-robot interact|knowledge graph|speech recognition not brain|ensemble model|fog computing|mapreduce|evolutionary computation|data science|text mining|generative model|active learning|swarm intelligence|multi-task learning|language model|collaborative filtering|backpropagation|machine vision|computer-aided diagnosis|gated recurrent unit|lagrange multiplier|expert system|learning rate|hadoop|markov process|nonlinear optimization|learning system|self-organizing map|smart manufacturing|smart home|few shot learning|few-shot learning|meta-learning|meta learning|adversarial training|zero-shot learning|word embedding|expectation maximization algorithm|stochastic gradient descent|ridge regression|deep belief network|non-negative matrix factorization|affective computing|latent dirichlet allocation|kernel method|kernel learning|feature engineering|variational inference|image representation|manifold learning|adversarial example|knowledge distillation|time series forecast|variational autoencoder|lasso regression|smart energy|dbscan|multi-label classification|intelligent robot|ubiquitous computing|gaussian mixture models|smart technolog|boltzmann machine|smart buildings|predictive analytic|pervasive computing|smart agriculture|capsule network|human-in-the-loop|intelligent agent|ai applications|word vector|transformer model|facial recognition|unstructured data|restricted boltzmann machine|albert|lifelong learning|autonomous agents|chatbot|cholesky decomposition|nosql|nosql|explainable ai|seq2seq|probabilistic graphical model|qr decomposition|unsupervised deep learning|data warehouse|quantum machine learning|continual learning|smart environment|multimodal learning|smart health|artificial immune system|swarm robotics|kernel machine|latent factor model|eigendecomposition|adversarial machine|adversarial machine learning|smart mobility|sequence-to-sequence model|eigen decomposition|adversarial robustness|smart parking|adversarial neural|roberta|bidirectional encoder representations from transformer|locally linear embedding|hebbian learning|one-shot learning|multimodal representation|smart tourism|entity extraction|adaptive moment estimation|ontology learning|topic modeling|relational database'" }, - "execution_count": 49, + "execution_count": 71, "metadata": {}, "output_type": "execute_result" } @@ -269,19 +269,29 @@ }, { "cell_type": "code", - "execution_count": 54, + "execution_count": null, + "outputs": [], + "source": [], + "metadata": { + "collapsed": false + } + }, + { + "cell_type": "code", + "execution_count": 72, "outputs": [ { "data": { "text/plain": " cpc_id cpc_name \n12725 A61B1/000096 {using artificial intelligence} \\\n13764 A61B5/7264 {Classification of physiological signals or da... \n13897 A61B6/52 {Devices using data or image processing specia... \n14016 A61B8/52 {Devices using data or image processing specia... \n15252 A61B2018/0069 {using fuzzy logic} \n... ... ... \n250685 Y10S707/99946 Object-oriented database structure network \n250686 Y10S707/99947 Object-oriented database structure reference \n250687 Y10S707/99948 Application of database or data structure, e.g... \n250688 Y10S707/99951 File or database maintenance \n250703 Y10S715/968 interface for database querying and retrieval \n\n section class subclass group main_group cpc_version \n12725 A 61 B 1 000096 2023 \\\n13764 A 61 B 5 7264 2023 \n13897 A 61 B 6 52 2023 \n14016 A 61 B 8 52 2023 \n15252 A 61 B 2018 0069 2023 \n... ... ... ... ... ... ... \n250685 Y 10 S 707 99946 2023 \n250686 Y 10 S 707 99947 2023 \n250687 Y 10 S 707 99948 2023 \n250688 Y 10 S 707 99951 2023 \n250703 Y 10 S 715 968 2023 \n\n version https://git-lfs.github.com/spec/v1 \n12725 NaN \\\n13764 NaN \n13897 NaN \n14016 NaN \n15252 NaN \n... ... \n250685 NaN \n250686 NaN \n250687 NaN \n250688 NaN \n250703 NaN \n\n cpc_taxonomy \n12725 [(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE... \n13764 [(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE... \n13897 [(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE... \n14016 [(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE... \n15252 [(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE... \n... ... \n250685 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... \n250686 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... \n250687 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... \n250688 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... \n250703 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... \n\n[317 rows x 10 columns]", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
cpc_idcpc_namesectionclasssubclassgroupmain_groupcpc_versionversion https://git-lfs.github.com/spec/v1cpc_taxonomy
12725A61B1/000096{using artificial intelligence}A61B10000962023NaN[(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE...
13764A61B5/7264{Classification of physiological signals or da...A61B572642023NaN[(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE...
13897A61B6/52{Devices using data or image processing specia...A61B6522023NaN[(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE...
14016A61B8/52{Devices using data or image processing specia...A61B8522023NaN[(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE...
15252A61B2018/0069{using fuzzy logic}A61B201800692023NaN[(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE...
.................................
250685Y10S707/99946Object-oriented database structure networkY10S707999462023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...
250686Y10S707/99947Object-oriented database structure referenceY10S707999472023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...
250687Y10S707/99948Application of database or data structure, e.g...Y10S707999482023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...
250688Y10S707/99951File or database maintenanceY10S707999512023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...
250703Y10S715/968interface for database querying and retrievalY10S7159682023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...
\n

317 rows × 10 columns

\n
" }, - "execution_count": 54, + "execution_count": 72, "metadata": {}, "output_type": "execute_result" } ], "source": [ + "#dummy search\n", "scope_df = cpc_ids[cpc_ids[\"cpc_name\"].str.lower().str.contains(\"machine learn|neural network|deep learn|deep network|artificial intel*| big data|database|recommender system|computer vision|image processing|language model|language processing|fuzzy logic|principal component|image classification|video classification\", regex=True, na=False)]\n", "scope_df" ], @@ -291,7 +301,29 @@ }, { "cell_type": "code", - "execution_count": 58, + "execution_count": 73, + "outputs": [ + { + "data": { + "text/plain": " cpc_id cpc_name \n12725 A61B1/000096 {using artificial intelligence} \\\n13746 A61B5/72 {Signal processing specially adapted for physi... \n13764 A61B5/7264 {Classification of physiological signals or da... \n13897 A61B6/52 {Devices using data or image processing specia... \n14016 A61B8/52 {Devices using data or image processing specia... \n... ... ... \n246159 Y10S128/924 using artificial intelligence \n246160 Y10S128/925 Neural network \n248454 Y10S323/909 Remote sensing \n250570 Y10S706/00 Data processing: artificial intelligence \n250571 Y10S706/90 Fuzzy logic \n\n section class subclass group main_group cpc_version \n12725 A 61 B 1 000096 2023 \\\n13746 A 61 B 5 72 2023 \n13764 A 61 B 5 7264 2023 \n13897 A 61 B 6 52 2023 \n14016 A 61 B 8 52 2023 \n... ... ... ... ... ... ... \n246159 Y 10 S 128 924 2023 \n246160 Y 10 S 128 925 2023 \n248454 Y 10 S 323 909 2023 \n250570 Y 10 S 706 00 2023 \n250571 Y 10 S 706 90 2023 \n\n version https://git-lfs.github.com/spec/v1 \n12725 NaN \\\n13746 NaN \n13764 NaN \n13897 NaN \n14016 NaN \n... ... \n246159 NaN \n246160 NaN \n248454 NaN \n250570 NaN \n250571 NaN \n\n cpc_taxonomy \n12725 [(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE... \n13746 [(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE... \n13764 [(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE... \n13897 [(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE... \n14016 [(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE... \n... ... \n246159 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... \n246160 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... \n248454 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... \n250570 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... \n250571 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... \n\n[358 rows x 10 columns]", + "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
cpc_idcpc_namesectionclasssubclassgroupmain_groupcpc_versionversion https://git-lfs.github.com/spec/v1cpc_taxonomy
12725A61B1/000096{using artificial intelligence}A61B10000962023NaN[(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE...
13746A61B5/72{Signal processing specially adapted for physi...A61B5722023NaN[(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE...
13764A61B5/7264{Classification of physiological signals or da...A61B572642023NaN[(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE...
13897A61B6/52{Devices using data or image processing specia...A61B6522023NaN[(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE...
14016A61B8/52{Devices using data or image processing specia...A61B8522023NaN[(A, HUMAN NECESSITIES), (A61, MEDICAL OR VETE...
.................................
246159Y10S128/924using artificial intelligenceY10S1289242023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...
246160Y10S128/925Neural networkY10S1289252023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...
248454Y10S323/909Remote sensingY10S3239092023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...
250570Y10S706/00Data processing: artificial intelligenceY10S706002023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...
250571Y10S706/90Fuzzy logicY10S706902023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...
\n

358 rows × 10 columns

\n
" + }, + "execution_count": 73, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "scope_df = cpc_ids[cpc_ids[\"cpc_name\"].str.lower().str.contains(keywords, regex=True, na=False)]\n", + "scope_df" + ], + "metadata": { + "collapsed": false + } + }, + { + "cell_type": "code", + "execution_count": 74, "id": "6c3baa5b", "metadata": {}, "outputs": [], @@ -303,13 +335,13 @@ }, { "cell_type": "code", - "execution_count": 59, + "execution_count": 75, "outputs": [ { "data": { "text/plain": "'WESTERN_CH_scope'" }, - "execution_count": 59, + "execution_count": 75, "metadata": {}, "output_type": "execute_result" } @@ -323,14 +355,14 @@ }, { "cell_type": "code", - "execution_count": 56, + "execution_count": 76, "outputs": [ { "data": { "text/plain": " cpc_id cpc_name \n0 A HUMAN NECESSITIES \\\n1 A01 AGRICULTURE; FORESTRY; ANIMAL HUSBANDRY; HUNTI... \n2 A01B SOIL WORKING IN AGRICULTURE OR FORESTRY; PARTS... \n3 A01B1/00 Hand tools (edge trimmers for lawns A01G3/06 ... \n4 A01B1/02 Spades; Shovels {(hand-operated dredgers E02F3... \n... ... ... \n260486 Y10T483/1873 Indexing matrix \n260487 Y10T483/1882 Rotary disc \n260488 Y10T483/1891 Chain or belt \n260489 Y10T483/19 Miscellaneous \n260490 NaN NaN \n\n section class subclass group main_group cpc_version \n0 A None None None None 2023 \\\n1 A 01 None None None 2023 \n2 A 01 B None None 2023 \n3 A 01 B 1 00 2023 \n4 A 01 B 1 02 2023 \n... ... ... ... ... ... ... \n260486 Y 10 T 483 1873 2023 \n260487 Y 10 T 483 1882 2023 \n260488 Y 10 T 483 1891 2023 \n260489 Y 10 T 483 19 2023 \n260490 NaN NaN NaN NaN NaN 2022 \n\n version https://git-lfs.github.com/spec/v1 \n0 NaN \\\n1 NaN \n2 NaN \n3 NaN \n4 NaN \n... ... \n260486 NaN \n260487 NaN \n260488 NaN \n260489 NaN \n260490 oid sha256:f138d6bdf2939ba576b96b633d81366123b... \n\n cpc_taxonomy data_scope \n0 [(A, HUMAN NECESSITIES)] False \n1 [(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO... False \n2 [(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO... False \n3 [(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO... False \n4 [(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO... False \n... ... ... \n260486 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... False \n260487 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... False \n260488 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... False \n260489 [(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE... False \n260490 [] False \n\n[260491 rows x 11 columns]", "text/html": "
\n\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n
cpc_idcpc_namesectionclasssubclassgroupmain_groupcpc_versionversion https://git-lfs.github.com/spec/v1cpc_taxonomydata_scope
0AHUMAN NECESSITIESANoneNoneNoneNone2023NaN[(A, HUMAN NECESSITIES)]False
1A01AGRICULTURE; FORESTRY; ANIMAL HUSBANDRY; HUNTI...A01NoneNoneNone2023NaN[(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO...False
2A01BSOIL WORKING IN AGRICULTURE OR FORESTRY; PARTS...A01BNoneNone2023NaN[(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO...False
3A01B1/00Hand tools (edge trimmers for lawns A01G3/06 ...A01B1002023NaN[(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO...False
4A01B1/02Spades; Shovels {(hand-operated dredgers E02F3...A01B1022023NaN[(A, HUMAN NECESSITIES), (A01, AGRICULTURE; FO...False
....................................
260486Y10T483/1873Indexing matrixY10T48318732023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...False
260487Y10T483/1882Rotary discY10T48318822023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...False
260488Y10T483/1891Chain or beltY10T48318912023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...False
260489Y10T483/19MiscellaneousY10T483192023NaN[(Y, GENERAL TAGGING OF NEW TECHNOLOGICAL DEVE...False
260490NaNNaNNaNNaNNaNNaNNaN2022oid sha256:f138d6bdf2939ba576b96b633d81366123b...[]False
\n

260491 rows × 11 columns

\n
" }, - "execution_count": 56, + "execution_count": 76, "metadata": {}, "output_type": "execute_result" }