Patent hub分享 http://blog.sciencenet.cn/u/yngcan 关注专利分析,知识产权与法律

博文

patstat 数据库结构

已有 8449 次阅读 2013-7-28 18:35 |个人分类:专利|系统分类:科研笔记| 数据库, PATSTAT

PATSTAT是当前世界上收录最全,且专门面向专利分析人员、统计决策人员、高级研究人员的专利数据库。

该数据库的主要特点在于:

数据来源超过100个国家;

包含6000万专利申请和3000万专利授权(包括PCT申请)

还有一个特点,它是以CAV格式保存的,与DOCDB的XML格式有所区别。

一句话够全。

其数据库结构如下:


数据导入方法:(收集到了PATSTAT数据的SQL数据库创建及导入方式,分享之~~~~~~~)

1. 创建方式

Database: `patstat`

--

-- CREATED BY JULIO RAFFO (EPFL/CEMI)


-- --------------------------------------------------------


-- Table structure for table `tls201_appln`

--


CREATE TABLE `tls201_appln` (

 `appln_id` int(9) NOT NULL default '0',

 `appln_auth` char(2) NOT NULL default '',

 `appln_nr` char(15) NOT NULL default '',

 `appln_kind` char(2) NOT NULL default '00',

 `appln_filing_date` date NOT NULL default '0000-00-00',

 `ipr_type` char(2) NOT NULL default '',

 `appln_title_lg` char(2) NOT NULL default '',

 `appln_abstract_lg` char(2) NOT NULL default '',

 `internat_appln_id` int(9) NOT NULL default '0',

 PRIMARY KEY  (`appln_id`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


-- Table structure for table `tls202_appln_title`


CREATE TABLE `tls202_appln_title` (

 `appln_id` int(4) NOT NULL default '0',

 `appln_title` text NOT NULL,

 PRIMARY KEY  (`appln_id`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


--

-- Table structure for table `tls203_appln_abstr`

--


CREATE TABLE `tls203_appln_abstr` (

 `appln_id` int(4) NOT NULL default '0',

 `appln_abstract` text NOT NULL

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


-- Table structure for table `tls204_appln_prior`

--


CREATE TABLE `tls204_appln_prior` (

 `APPLN_ID` int(4) NOT NULL default '0',

 `PRIOR_APPLN_ID` int(4) NOT NULL default '0',

 `PRIOR_APPLN_SEQ_NR` smallint(2) NOT NULL default '0',

 PRIMARY KEY  (`APPLN_ID`,`PRIOR_APPLN_ID`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


-- Table structure for table `tls205_tech_rel`


CREATE TABLE `tls205_tech_rel` (

 `APPLN_ID` int(4) NOT NULL default '0',

 `TECH_REL_APPLN_ID` int(4) NOT NULL default '0',

 PRIMARY KEY  (`APPLN_ID`,`TECH_REL_APPLN_ID`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------

 

-- Table structure for table `tls206_person`


CREATE TABLE `tls206_person` (

 `person_id` int(4) NOT NULL default '0',

 `person_ctry_code` varchar(2) NOT NULL default '',

 `doc_std_name_id` int(4) NOT NULL default '0',

 `person_name` text NOT NULL,

 `person_address` text NOT NULL,

 PRIMARY KEY  (`person_id`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


-- Table structure for table `tls207_pers_appln`


CREATE TABLE `tls207_pers_appln` (

 `person_id` int(4) NOT NULL default '0',

 `appln_id` int(4) NOT NULL default '0',

 `applt_seq_nr` smallint(2) NOT NULL default '0',

 `invt_seq_nr` smallint(2) NOT NULL default '0',

 KEY `person_id` (`person_id`),

 KEY `appln_id` (`appln_id`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


-- Table structure for table `tls208_doc_std_nms`


CREATE TABLE `tls208_doc_std_nms` (

 `doc_std_name_id` int(4) NOT NULL default '0',

 `doc_std_name` char(30) NOT NULL default '',

 PRIMARY KEY  (`doc_std_name_id`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


--

-- Table structure for table `tls209_appln_ipc`


CREATE TABLE `tls209_appln_ipc` (

 `appln_id` int(4) NOT NULL default '0',

 `ipc_class_symbol` char(15) NOT NULL default '',

 `ipc_version` date NOT NULL default '0000-00-00',

 `ipc_value` char(1) NOT NULL default '',

 `ipc_position` char(1) NOT NULL default '',

 `ipc_gener_auth` char(2) NOT NULL default '',

 PRIMARY KEY  (`appln_id`,`ipc_class_symbol`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


-- Table structure for table `tls210_appln_n_cls`


CREATE TABLE `tls210_appln_n_cls` (

 `appln_id` int(4) NOT NULL default '0',

 `nat_class_symbol` char(15) NOT NULL default ''

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


-- Table structure for table `tls211_pat_publn`


CREATE TABLE `tls211_pat_publn` (

 `pat_publn_id` int(11) NOT NULL default '0',

 `publn_auth` char(2) NOT NULL default '',

 `publn_nr` char(15) NOT NULL default '',

 `publn_kind` char(2) NOT NULL default '',

 `appln_id` int(11) NOT NULL default '0',

 `publn_date` date NOT NULL default '0001-01-01',

 `publn_lg` char(2) NOT NULL default '',

 PRIMARY KEY  (`pat_publn_id`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


-- Table structure for table `tls212_citation`


CREATE TABLE `tls212_citation` (

 `pat_publn_id` int(8) NOT NULL default '0',

 `citn_id` tinyint(3) NOT NULL default '0',

 `cited_pat_publn_id` int(8) NOT NULL default '0',

 `npl_publn_id` int(8) NOT NULL default '0',

 `pat_citn_seq_nr` tinyint(3) NOT NULL default '0',

 `npl_citn_seq_nr` tinyint(3) NOT NULL default '0',

 `citn_origin` char(5) NOT NULL default ''

) ENGINE=MyISAM DEFAULT CHARSET=utf8 PACK_KEYS=0;


-- --------------------------------------------------------


-- Table structure for table `tls214_npl_publn`


CREATE TABLE `tls214_npl_publn` (

 `npl_publn_id` int(4) NOT NULL default '0',

 `npl_biblio` text NOT NULL,

 PRIMARY KEY  (`npl_publn_id`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


-- Table structure for table `tls215_citn_categ`


CREATE TABLE `tls215_citn_categ` (

 `pat_publn_id` int(4) NOT NULL default '0',

 `citn_id` smallint(2) NOT NULL default '0',

 `citn_categ` char(1) NOT NULL default '',

 PRIMARY KEY  (`pat_publn_id`,`citn_id`,`citn_categ`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


-- --------------------------------------------------------


-- Table structure for table `tls216_appln_contn`


CREATE TABLE `tls216_appln_contn` (

 `APPLN_ID` int(10) NOT NULL default '0',

 `PARENT_APPLN_ID` int(10) NOT NULL default '0',

 `CONTN_TYPE` char(3) NOT NULL default '',

 PRIMARY KEY  (`APPLN_ID`,`PARENT_APPLN_ID`)

) ENGINE=MyISAM DEFAULT CHARSET=utf8;


2. 导入方式

-- Database: `patstat`

--

-- BY JULIO RAFFO (EPFL/CEMI)

--

-- Patstat documentation info:


-- [mysqlimport]

-- verbose

-- local=1

-- ignore-lines=1

-- fields-terminated-by=","

-- fields-optionally-enclosed-by='"'

-- fields-escaped-by=""

-- lines-terminated-by="rn"

-- host="localhost"

-- password=""


-- --------------------------------------------------------


--

-- Uploading `tls201_appln`

-- ok (but 2 rows less)


LOAD DATA INFILE 'patstat/raw/tls201_part1.txt' INTO TABLE patstat.tls201_appln

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls201_part2.txt' INTO TABLE patstat.tls201_appln

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls201_part3.txt' INTO TABLE patstat.tls201_appln

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

IGNORE 1 LINES ;


-- --------------------------------------------------------


-- Uploading `tls202_title`

-- ok, but 13 rows less


LOAD DATA INFILE 'patstat/raw/tls202_part1.txt' INTO TABLE patstat.tls202_appln_title

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls202_part2.txt' INTO TABLE patstat.tls202_appln_title

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls202_part3.txt' INTO TABLE patstat.tls202_appln_title

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls202_part4.txt' INTO TABLE patstat.tls202_appln_title

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls202_part5.txt' INTO TABLE patstat.tls202_appln_title

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


-- --------------------------------------------------------


-- Uploading `tls203_appln_abstr`

-- ok, but 89 rows less (after taking out primary key, due double ids)



LOAD DATA INFILE 'patstat/raw/tls203_part1.txt' INTO TABLE patstat.tls203_appln_abstr

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls203_part2.txt' INTO TABLE patstat.tls203_appln_abstr

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls203_part3.txt' INTO TABLE patstat.tls203_appln_abstr

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls203_part4.txt' INTO TABLE patstat.tls203_appln_abstr

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls203_part5.txt' INTO TABLE patstat.tls203_appln_abstr

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls203_part6.txt' INTO TABLE patstat.tls203_appln_abstr

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls203_part7.txt' INTO TABLE patstat.tls203_appln_abstr

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls203_part8.txt' INTO TABLE patstat.tls203_appln_abstr

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls203_part9.txt' INTO TABLE patstat.tls203_appln_abstr

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


-- --------------------------------------------------------

-- Uploading `tls204_appln_prior`

-- ok


LOAD DATA INFILE 'patstat/raw/tls204_part1.txt' INTO TABLE patstat.tls204_appln_prior

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

IGNORE 1 LINES ;


-- --------------------------------------------------------


-- Uploading `tls205_tech_rel`

-- ok


LOAD DATA INFILE 'patstat/raw/tls205_part1.txt' INTO TABLE patstat.tls205_tech_rel

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

IGNORE 1 LINES ;


-- --------------------------------------------------------


-- Uploading `tls206_person`

-- ok, but 10 rows less


LOAD DATA INFILE 'patstat/raw/tls206_part1.txt' INTO TABLE patstat.tls206_person

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls206_part2.txt' INTO TABLE patstat.tls206_person

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls206_part3.txt' INTO TABLE patstat.tls206_person

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls206_part4.txt' INTO TABLE patstat.tls206_person

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;

-- --------------------------------------------------------


-- Uploading `tls207_pers_appln`

-- ok (but 2 rows less)


LOAD DATA INFILE 'patstat/raw/tls207_part1.txt' INTO TABLE patstat.tls207_pers_appln

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls207_part2.txt' INTO TABLE patstat.tls207_pers_appln

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls207_part3.txt' INTO TABLE patstat.tls207_pers_appln

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls207_part4.txt' INTO TABLE patstat.tls207_pers_appln

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

IGNORE 1 LINES ;


-- --------------------------------------------------------


--

-- Uploading `tls208_doc_std_nms`

-- ok


LOAD DATA INFILE 'patstat/raw/tls208_part1.txt' INTO TABLE patstat.tls208_doc_std_nms

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;

-- --------------------------------------------------------

-- Uploading `tls209_appln_ipc`

-- ok (but 4 rows less)


LOAD DATA INFILE 'patstat/raw/tls209_part1.txt' INTO TABLE patstat.tls209_appln_ipc

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls209_part2.txt' INTO TABLE patstat.tls209_appln_ipc

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls209_part3.txt' INTO TABLE patstat.tls209_appln_ipc

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls209_part4.txt' INTO TABLE patstat.tls209_appln_ipc

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls209_part5.txt' INTO TABLE patstat.tls209_appln_ipc

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls209_part6.txt' INTO TABLE patstat.tls209_appln_ipc

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls209_part7.txt' INTO TABLE patstat.tls209_appln_ipc

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls209_part8.txt' INTO TABLE patstat.tls209_appln_ipc

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls209_part9.txt' INTO TABLE patstat.tls209_appln_ipc

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;

-- --------------------------------------------------------


-- Uploading `tls210_appln_n_cls`

-- ok


LOAD DATA INFILE 'patstat/raw/tls210_part1.txt' INTO TABLE patstat.tls210_appln_n_cls

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


-- --------------------------------------------------------


-- Uploading `tls211_pat_publn`

-- ok (but 2 rows less)


LOAD DATA INFILE 'patstat/raw/tls211_part1.txt' INTO TABLE patstat.tls211_pat_publn

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls211_part2.txt' INTO TABLE patstat.tls211_pat_publn

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls211_part3.txt' INTO TABLE patstat.tls211_pat_publn

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;

-- --------------------------------------------------------

-- Uploading `tls212_citation`

-- ok (but 4 rows less)


LOAD DATA INFILE 'patstat/raw/tls212_part1.txt' INTO TABLE patstat.tls212_citation

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls212_part2.txt' INTO TABLE patstat.tls212_citation

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls212_part3.txt' INTO TABLE patstat.tls212_citation

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls212_part4.txt' INTO TABLE patstat.tls212_citation

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


LOAD DATA INFILE 'patstat/raw/tls212_part5.txt' INTO TABLE patstat.tls212_citation

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;


-- --------------------------------------------------------


--

-- Uploading `tls214_npl_publn`

-- ok (but 1 rows less)


LOAD DATA INFILE 'patstat/raw/tls214_part1.txt' INTO TABLE patstat.tls214_npl_publn

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;

-- --------------------------------------------------------

-- Uploading `tls215_citn_categ`

-- ok (but 7 rows less)


LOAD DATA INFILE 'patstat/raw/tls215_part1.txt' INTO TABLE patstat.tls215_citn_categ

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;

-- --------------------------------------------------------

-- Uploading `tls216_appln_contn`

-- ok


LOAD DATA INFILE 'patstat/raw/tls216_part1.txt' INTO TABLE patstat.tls216_appln_contn

FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'

lines terminated by 'rn'

IGNORE 1 LINES ;




https://wap.sciencenet.cn/blog-357889-712015.html

上一篇:EXCEL删除重复项的做法
下一篇:中国专利质量观察——利用专利家族(三国)指标
收藏 IP: 106.3.103.*| 热度|

0

该博文允许注册用户评论 请点击登录 评论 (2 个评论)

数据加载中...

Archiver|手机版|科学网 ( 京ICP备07017567号-12 )

GMT+8, 2024-4-30 21:03

Powered by ScienceNet.cn

Copyright © 2007- 中国科学报社

返回顶部