From 760e350ba3d27cd2d9664b530d91cafc8bf8bd46 Mon Sep 17 00:00:00 2001 From: firstdata-dev Date: Tue, 21 Apr 2026 10:05:38 +0800 Subject: [PATCH 1/3] feat: add 5 Chinese government data sources (AM batch, 2026-04-21) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - china-eximbank: Export-Import Bank of China (中国进出口银行) - policy bank for foreign trade finance - china-cdb: China Development Bank (国家开发银行) - largest policy bank for infrastructure finance - china-scidb: Science Data Bank (科学数据银行) - CAS national open scientific data repository - china-ngdc: National Genomics Data Center (国家基因组科学数据中心) - CAS genomics/bioinformatics data - china-cqc: China Quality Certification Centre (中国质量认证中心) - CCC/3C certification database --- .../sources/china/finance/banking/cdb.json | 65 +++++++++++++++++ .../china/finance/banking/eximbank.json | 66 ++++++++++++++++++ firstdata/sources/china/governance/cqc.json | 66 ++++++++++++++++++ firstdata/sources/china/research/ngdc.json | 69 +++++++++++++++++++ firstdata/sources/china/research/scidb.json | 65 +++++++++++++++++ 5 files changed, 331 insertions(+) create mode 100644 firstdata/sources/china/finance/banking/cdb.json create mode 100644 firstdata/sources/china/finance/banking/eximbank.json create mode 100644 firstdata/sources/china/governance/cqc.json create mode 100644 firstdata/sources/china/research/ngdc.json create mode 100644 firstdata/sources/china/research/scidb.json diff --git a/firstdata/sources/china/finance/banking/cdb.json b/firstdata/sources/china/finance/banking/cdb.json new file mode 100644 index 0000000..5ff5733 --- /dev/null +++ b/firstdata/sources/china/finance/banking/cdb.json @@ -0,0 +1,65 @@ +{ + "id": "china-cdb", + "name": { + "en": "China Development Bank", + "zh": "国家开发银行" + }, + "description": { + "en": "The China Development Bank (CDB) is China's largest policy bank and development finance institution, directly supervised by the State Council. 
Established in 1994, it provides medium- and long-term financing for major national strategic projects in infrastructure, basic industries, and pillar industries. CDB publishes annual reports, financial statements, bond issuance data, and statistics on lending to key sectors including transportation, energy, water resources, urban development, and international cooperation.", + "zh": "国家开发银行是中国最大的政策性银行和开发性金融机构,直属国务院监管,成立于1994年,为基础设施、基础产业和支柱产业等国家重大战略项目提供中长期融资。发布年度报告、财务报表、债券发行数据及交通、能源、水利、城镇化建设和国际合作等重点领域贷款统计数据。" + }, + "website": "https://www.cdb.com.cn", + "data_url": "https://www.cdb.com.cn/zwgk/", + "api_url": null, + "authority_level": "government", + "country": "CN", + "domains": [ + "finance", + "banking", + "infrastructure" + ], + "geographic_scope": "national", + "update_frequency": "annual", + "tags": [ + "china", + "development-bank", + "policy-bank", + "infrastructure-finance", + "long-term-lending", + "bond-issuance", + "国家开发银行", + "政策性银行", + "开发性金融", + "基础设施", + "中长期贷款", + "债券", + "能源贷款", + "交通贷款", + "城镇化", + "national-development", + "cdb", + "annual-report" + ], + "data_content": { + "en": [ + "Annual Reports - Full financial statements, business review, capital adequacy, and risk management disclosure", + "Bond Issuances - Domestic and international bond prospectuses, rates, and maturity schedules", + "Sector Lending Data - Loans outstanding by sector: transportation, energy, water, urban, education, agriculture", + "Infrastructure Finance - Financing volume for highways, railways, airports, and urban infrastructure", + "Poverty Alleviation Finance - Targeted lending statistics for poverty reduction and rural revitalization", + "International Cooperation - Overseas lending statistics and development finance for BRI projects", + "Green Finance - Green bonds and environmental lending statistics", + "Information Disclosure (ZWGK) - Regulatory filings, business reports, and governance documents" + ], + "zh": [ + "年度报告 - 完整财务报表、业务回顾、资本充足率及风险管理披露", + "债券发行 - 
境内外债券募集说明书、利率及到期安排", + "行业贷款数据 - 按行业划分的贷款余额:交通、能源、水利、城镇、教育、农业", + "基础设施融资 - 公路、铁路、机场及城市基础设施的融资规模", + "脱贫攻坚金融 - 精准扶贫和乡村振兴的专项贷款统计", + "国际合作 - 境外贷款统计数据及一带一路项目开发性融资", + "绿色金融 - 绿色债券和环保领域贷款统计", + "政务公开(ZWGK) - 监管报备、业务报告及公司治理文件" + ] + } +} diff --git a/firstdata/sources/china/finance/banking/eximbank.json b/firstdata/sources/china/finance/banking/eximbank.json new file mode 100644 index 0000000..a4f990f --- /dev/null +++ b/firstdata/sources/china/finance/banking/eximbank.json @@ -0,0 +1,66 @@ +{ + "id": "china-eximbank", + "name": { + "en": "Export-Import Bank of China", + "zh": "中国进出口银行" + }, + "description": { + "en": "The Export-Import Bank of China (EXIM China) is a state-owned policy bank directly under the State Council, established in 1994. It is the sole Chinese government agency bank mandated to provide policy financial services to support China's foreign trade, overseas investment, and international economic cooperation. It publishes annual reports, financial statements, bond issuance data, country loan data, and statistics on export seller's credit, export buyer's credit, import credit, and overseas investment loans.", + "zh": "中国进出口银行是直属国务院领导的国家政策性银行,成立于1994年,是唯一被授权承担政策性对外贸易金融业务的政府直属机构,主要支持中国对外贸易、境外投资和国际经济合作。发布年度报告、财务报表、债券发行数据、国别贷款数据及出口卖方信贷、出口买方信贷、进口信贷和境外投资贷款统计数据。" + }, + "website": "http://www.eximbank.gov.cn", + "data_url": "http://www.eximbank.gov.cn/cn/index/information/annual/index.html", + "api_url": null, + "authority_level": "government", + "country": "CN", + "domains": [ + "finance", + "trade", + "banking" + ], + "geographic_scope": "national", + "update_frequency": "annual", + "tags": [ + "china", + "policy-bank", + "export-credit", + "import-credit", + "trade-finance", + "foreign-trade", + "overseas-investment", + "belt-and-road", + "中国进出口银行", + "政策性银行", + "出口信贷", + "进口信贷", + "对外贸易", + "境外投资", + "一带一路", + "国际合作", + "债券", + "annual-report", + "development-finance" + ], + "data_content": { + "en": [ + "Annual Reports - Financial statements, business overview, key 
operational indicators and risk management data", + "Export Seller's Credit - Credit data for Chinese enterprises exporting goods, technology, and services", + "Export Buyer's Credit - Loans to foreign importers purchasing Chinese products and services", + "Overseas Investment Loans - Financing data for Chinese enterprises investing abroad", + "Government Concessional Loans - Concessional loans and preferential export buyer's credit to developing countries", + "Bond Issuances - Domestic and international bond offering data, prospectuses", + "Country Exposure - Loan exposure data by country and region", + "Belt and Road Initiative - Project financing statistics for BRI partner countries" + ], + "zh": [ + "年度报告 - 财务报表、业务概况、主要经营指标及风险管理数据", + "出口卖方信贷 - 中国企业出口商品、技术和服务的信贷数据", + "出口买方信贷 - 向境外进口商提供的采购中国产品和服务的贷款", + "境外投资贷款 - 中国企业境外投资的融资数据", + "对外优惠贷款 - 向发展中国家提供的优惠贷款和优惠出口买方信贷", + "债券发行 - 境内外债券发行数据、募集说明书", + "国别敞口 - 按国家和地区划分的贷款风险敞口数据", + "一带一路 - 共建\"一带一路\"伙伴国家项目融资统计数据" + ] + } +} diff --git a/firstdata/sources/china/governance/cqc.json b/firstdata/sources/china/governance/cqc.json new file mode 100644 index 0000000..7549a0e --- /dev/null +++ b/firstdata/sources/china/governance/cqc.json @@ -0,0 +1,66 @@ +{ + "id": "china-cqc", + "name": { + "en": "China Quality Certification Centre", + "zh": "中国质量认证中心" + }, + "description": { + "en": "China Quality Certification Centre (CQC) is China's largest and most authoritative third-party certification body, authorized by the State Administration for Market Regulation (SAMR). 
It administers China Compulsory Certification (CCC/3C), voluntary product quality certifications, management system certifications (ISO 9001, ISO 14001, ISO 45001), and publishes public databases of certified products, certification statistics, and certification status queries for domestic and export products.", + "zh": "中国质量认证中心(CQC)是中国最大、最权威的第三方认证机构,由国家市场监督管理总局授权。负责实施中国强制认证(CCC/3C认证)、自愿性产品质量认证、管理体系认证(ISO 9001、ISO 14001、ISO 45001),并发布认证产品公开数据库、认证统计数据及境内外产品认证状态查询服务。" + }, + "website": "https://www.cqc.com.cn", + "data_url": "https://www.cqc.com.cn/", + "api_url": null, + "authority_level": "government", + "country": "CN", + "domains": [ + "standards", + "governance", + "trade" + ], + "geographic_scope": "national", + "update_frequency": "irregular", + "tags": [ + "china", + "certification", + "CCC", + "3C认证", + "quality-certification", + "product-safety", + "iso-9001", + "iso-14001", + "management-system", + "compulsory-certification", + "中国质量认证中心", + "强制认证", + "产品认证", + "质量认证", + "认证查询", + "市场监管", + "合规", + "product-compliance", + "samr" + ], + "data_content": { + "en": [ + "CCC Certificate Database - Public query system for China Compulsory Certification (3C) certificates by product, manufacturer, or certificate number", + "Voluntary Product Certifications - Safety mark (CQC Mark) certificates for non-mandatory product categories", + "Management System Certifications - ISO 9001, 14001, 45001, and other management system certificate status", + "Certification Statistics - Annual certification issuance counts by product category, industry, and region", + "Suspended and Revoked Certificates - Public list of suspended, revoked, or invalid certification records", + "Certified Manufacturer Directory - Database of manufacturers holding valid CQC certifications", + "Green Product Certification - Environmental and energy-efficiency certification data", + "Export Certification Data - Certification data for Chinese products destined for foreign markets" + ], + "zh": [ + 
"CCC证书数据库 - 按产品、生产商或证书编号查询中国强制认证(3C)证书的公开查询系统", + "自愿性产品认证 - 非强制性产品类别的CQC标志安全认证证书", + "管理体系认证 - ISO 9001、14001、45001及其他管理体系认证状态", + "认证统计数据 - 按产品类别、行业和地区划分的年度认证颁证数量", + "暂停和撤销证书 - 已暂停、撤销或失效认证记录的公开清单", + "获证厂商目录 - 持有有效CQC认证的生产商数据库", + "绿色产品认证 - 环保和节能认证数据", + "出口认证数据 - 中国出口产品认证数据" + ] + } +} diff --git a/firstdata/sources/china/research/ngdc.json b/firstdata/sources/china/research/ngdc.json new file mode 100644 index 0000000..2193705 --- /dev/null +++ b/firstdata/sources/china/research/ngdc.json @@ -0,0 +1,69 @@ +{ + "id": "china-ngdc", + "name": { + "en": "National Genomics Data Center", + "zh": "国家基因组科学数据中心" + }, + "description": { + "en": "The National Genomics Data Center (NGDC) is China's national repository for genomics and bioinformatics data, operated by the Beijing Institute of Genomics, Chinese Academy of Sciences (China National Center for Bioinformation). It hosts the Genome Sequence Archive (GSA), BIG Data Center databases, and provides comprehensive resources for genomic sequences, gene expression, population genetics, and related omics data from Chinese and international research projects.", + "zh": "国家基因组科学数据中心(NGDC)是中国国家级基因组与生物信息学数据仓库,由中国科学院北京基因组研究所(国家生物信息中心)运营。托管基因组序列档案(GSA)和BIG数据中心数据库,为来自中国及国际研究项目的基因组序列、基因表达、群体遗传学及相关组学数据提供全面资源支持。" + }, + "website": "https://ngdc.cncb.ac.cn", + "data_url": "https://ngdc.cncb.ac.cn/gsub/", + "api_url": "https://ngdc.cncb.ac.cn/api/", + "authority_level": "research", + "country": "CN", + "domains": [ + "health", + "science", + "research" + ], + "geographic_scope": "national", + "update_frequency": "irregular", + "tags": [ + "china", + "genomics", + "bioinformatics", + "dna-sequence", + "gene-expression", + "population-genetics", + "omics", + "cas", + "gsa", + "genome-archive", + "国家基因组科学数据中心", + "中国科学院", + "基因组学", + "生物信息学", + "基因序列", + "基因表达", + "群体遗传", + "组学数据", + "生命科学", + "ncbi-equivalent" + ], + "data_content": { + "en": [ + "Genome Sequence Archive (GSA) - Raw sequencing data repository for nucleotide sequences 
from China and globally", + "BioProject - Project-level metadata for genomic research studies", + "BioSample - Biological sample metadata linked to sequence data", + "Gene Expression Nebulas (GEN) - Single-cell and bulk RNA-seq gene expression datasets", + "Genome Variation Map (GVM) - Human genomic variation data including SNPs and structural variants", + "GWAS Atlas - Curated genome-wide association study data and results", + "Integrated Microbial Genomes - Microbial genome sequences and functional annotation", + "Population Genomics Data - Large-scale human population sequencing datasets from Chinese cohort studies", + "Proteomics and Metabolomics - Mass spectrometry-based protein and metabolite datasets" + ], + "zh": [ + "基因组序列档案(GSA) - 来自中国及全球的核苷酸序列原始数据仓库", + "BioProject - 基因组研究项目的项目级元数据", + "BioSample - 与序列数据关联的生物样本元数据", + "基因表达星云(GEN) - 单细胞和bulk RNA-seq基因表达数据集", + "基因组变异图谱(GVM) - 人类基因组变异数据,包括SNP和结构变异", + "GWAS图集 - 已审编的全基因组关联研究数据及结果", + "整合微生物基因组 - 微生物基因组序列和功能注释", + "群体基因组数据 - 来自中国队列研究的大规模人群测序数据集", + "蛋白质组与代谢组 - 基于质谱的蛋白质和代谢物数据集" + ] + } +} diff --git a/firstdata/sources/china/research/scidb.json b/firstdata/sources/china/research/scidb.json new file mode 100644 index 0000000..836aafd --- /dev/null +++ b/firstdata/sources/china/research/scidb.json @@ -0,0 +1,65 @@ +{ + "id": "china-scidb", + "name": { + "en": "Science Data Bank", + "zh": "科学数据银行" + }, + "description": { + "en": "Science Data Bank (SciDB) is China's national open scientific research data repository, operated by the Computer Network Information Center of the Chinese Academy of Sciences. It provides a platform for researchers to share, publish, and access scientific datasets across disciplines including life sciences, earth sciences, materials science, and environmental science. 
SciDB supports FAIR data principles and is integrated with major Chinese scientific journals for data-article linking.", + "zh": "科学数据银行(SciDB)是中国国家级开放科研数据仓库,由中国科学院计算机网络信息中心运营,为研究人员提供跨学科科学数据的共享、发布和获取平台,涵盖生命科学、地球科学、材料科学和环境科学等领域。SciDB支持FAIR数据原则,并与国内主要科学期刊深度集成,实现数据与论文的关联发布。" + }, + "website": "https://www.scidb.cn", + "data_url": "https://www.scidb.cn/en/list", + "api_url": null, + "authority_level": "research", + "country": "CN", + "domains": [ + "science", + "research", + "environment" + ], + "geographic_scope": "national", + "update_frequency": "irregular", + "tags": [ + "china", + "scientific-data", + "open-data", + "research-data", + "cas", + "data-repository", + "life-sciences", + "earth-sciences", + "materials-science", + "fair-data", + "科学数据银行", + "中国科学院", + "开放数据", + "科研数据", + "数据共享", + "跨学科", + "数据仓库", + "数据论文" + ], + "data_content": { + "en": [ + "Life Sciences Data - Genomics, proteomics, ecology, and biodiversity datasets", + "Earth Sciences Data - Geophysics, geology, atmospheric science, and oceanography datasets", + "Materials Science Data - Crystal structures, material properties, and experimental datasets", + "Environmental Science Data - Climate, pollution, and ecosystem monitoring datasets", + "Dataset Publications - Peer-reviewed data articles with DOI-assigned datasets", + "Cross-Disciplinary Data - Multi-domain datasets from Chinese research institutions and universities", + "Data Access Metrics - Download statistics, citation counts, and usage analytics for published datasets", + "Data Standards - Metadata schemas, data format standards, and quality documentation" + ], + "zh": [ + "生命科学数据 - 基因组学、蛋白质组学、生态学和生物多样性数据集", + "地球科学数据 - 地球物理、地质、大气科学和海洋学数据集", + "材料科学数据 - 晶体结构、材料性能及实验数据集", + "环境科学数据 - 气候、污染和生态系统监测数据集", + "数据论文发布 - 经同行评审的数据论文及配套DOI数据集", + "跨学科数据 - 来自中国科研机构和高校的多领域数据集", + "数据访问指标 - 已发布数据集的下载量、引用次数和使用分析", + "数据标准 - 元数据模式、数据格式标准及质量文档" + ] + } +} From c961f16f14ff4a21b3a322e5b3c938bf25c3fe0c Mon Sep 17 00:00:00 2001 From: firstdata-dev Date: 
Tue, 21 Apr 2026 10:08:59 +0800 Subject: [PATCH 2/3] fix: replace duplicate china-cqc (already in PR#164) with china-catarc - Remove china-cqc: already exists in PR #164 branch (cross-batch duplicate) - Add china-catarc: China Automotive Technology and Research Center (CATARC) --- firstdata/sources/china/governance/cqc.json | 66 ------------------- .../sources/china/research/china-catarc.json | 23 +++++++ 2 files changed, 23 insertions(+), 66 deletions(-) delete mode 100644 firstdata/sources/china/governance/cqc.json create mode 100644 firstdata/sources/china/research/china-catarc.json diff --git a/firstdata/sources/china/governance/cqc.json b/firstdata/sources/china/governance/cqc.json deleted file mode 100644 index 7549a0e..0000000 --- a/firstdata/sources/china/governance/cqc.json +++ /dev/null @@ -1,66 +0,0 @@ -{ - "id": "china-cqc", - "name": { - "en": "China Quality Certification Centre", - "zh": "中国质量认证中心" - }, - "description": { - "en": "China Quality Certification Centre (CQC) is China's largest and most authoritative third-party certification body, authorized by the State Administration for Market Regulation (SAMR). 
It administers China Compulsory Certification (CCC/3C), voluntary product quality certifications, management system certifications (ISO 9001, ISO 14001, ISO 45001), and publishes public databases of certified products, certification statistics, and certification status queries for domestic and export products.", - "zh": "中国质量认证中心(CQC)是中国最大、最权威的第三方认证机构,由国家市场监督管理总局授权。负责实施中国强制认证(CCC/3C认证)、自愿性产品质量认证、管理体系认证(ISO 9001、ISO 14001、ISO 45001),并发布认证产品公开数据库、认证统计数据及境内外产品认证状态查询服务。" - }, - "website": "https://www.cqc.com.cn", - "data_url": "https://www.cqc.com.cn/", - "api_url": null, - "authority_level": "government", - "country": "CN", - "domains": [ - "standards", - "governance", - "trade" - ], - "geographic_scope": "national", - "update_frequency": "irregular", - "tags": [ - "china", - "certification", - "CCC", - "3C认证", - "quality-certification", - "product-safety", - "iso-9001", - "iso-14001", - "management-system", - "compulsory-certification", - "中国质量认证中心", - "强制认证", - "产品认证", - "质量认证", - "认证查询", - "市场监管", - "合规", - "product-compliance", - "samr" - ], - "data_content": { - "en": [ - "CCC Certificate Database - Public query system for China Compulsory Certification (3C) certificates by product, manufacturer, or certificate number", - "Voluntary Product Certifications - Safety mark (CQC Mark) certificates for non-mandatory product categories", - "Management System Certifications - ISO 9001, 14001, 45001, and other management system certificate status", - "Certification Statistics - Annual certification issuance counts by product category, industry, and region", - "Suspended and Revoked Certificates - Public list of suspended, revoked, or invalid certification records", - "Certified Manufacturer Directory - Database of manufacturers holding valid CQC certifications", - "Green Product Certification - Environmental and energy-efficiency certification data", - "Export Certification Data - Certification data for Chinese products destined for foreign markets" - ], - "zh": [ - 
"CCC证书数据库 - 按产品、生产商或证书编号查询中国强制认证(3C)证书的公开查询系统", - "自愿性产品认证 - 非强制性产品类别的CQC标志安全认证证书", - "管理体系认证 - ISO 9001、14001、45001及其他管理体系认证状态", - "认证统计数据 - 按产品类别、行业和地区划分的年度认证颁证数量", - "暂停和撤销证书 - 已暂停、撤销或失效认证记录的公开清单", - "获证厂商目录 - 持有有效CQC认证的生产商数据库", - "绿色产品认证 - 环保和节能认证数据", - "出口认证数据 - 中国出口产品认证数据" - ] - } -} diff --git a/firstdata/sources/china/research/china-catarc.json b/firstdata/sources/china/research/china-catarc.json new file mode 100644 index 0000000..0beb56a --- /dev/null +++ b/firstdata/sources/china/research/china-catarc.json @@ -0,0 +1,23 @@ +{ + "id": "china-catarc", + "name": { + "en": "China Automotive Technology and Research Center", + "zh": "中国汽车技术研究中心" + }, + "description": { + "en": "The China Automotive Technology and Research Center (CATARC) is a national-level research institution under SASAC, providing automotive industry testing, certification, standards development, and policy research. It publishes vehicle sales data, new energy vehicle statistics, and automotive safety reports.", + "zh": "中国汽车技术研究中心(中汽中心)是国资委直属的国家级研究机构,提供汽车行业测试、认证、标准制定和政策研究服务。发布汽车销量数据、新能源汽车统计和汽车安全报告。" + }, + "data_content": { + "en": ["vehicle sales statistics", "new energy vehicle data", "automotive safety reports", "emission standards data", "vehicle certification records"], + "zh": ["汽车销量统计", "新能源汽车数据", "汽车安全报告", "排放标准数据", "车辆认证记录"] + }, + "country": "CN", + "authority_level": "research", + "geographic_scope": "national", + "website": "https://www.catarc.ac.cn", + "data_url": "https://www.catarc.ac.cn", + "domains": ["transportation", "manufacturing"], + "tags": ["automotive", "vehicles", "new-energy", "safety", "certification", "sasac"], + "update_frequency": "monthly" +} From ee0d6922b2dea415918b9f9ce91adada5320c186 Mon Sep 17 00:00:00 2001 From: firstdata-dev Date: Tue, 21 Apr 2026 10:09:51 +0800 Subject: [PATCH 3/3] =?UTF-8?q?fix:=20correct=20china-cdb=20data=5Furl=20(?= =?UTF-8?q?deep=20path=20404=E2=86=92root)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 
Content-Transfer-Encoding: 8bit --- firstdata/sources/china/finance/banking/cdb.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/firstdata/sources/china/finance/banking/cdb.json b/firstdata/sources/china/finance/banking/cdb.json index 5ff5733..bd6ea53 100644 --- a/firstdata/sources/china/finance/banking/cdb.json +++ b/firstdata/sources/china/finance/banking/cdb.json @@ -9,7 +9,7 @@ "zh": "国家开发银行是中国最大的政策性银行和开发性金融机构,直属国务院监管,成立于1994年,为基础设施、基础产业和支柱产业等国家重大战略项目提供中长期融资。发布年度报告、财务报表、债券发行数据及交通、能源、水利、城镇化建设和国际合作等重点领域贷款统计数据。" }, "website": "https://www.cdb.com.cn", - "data_url": "https://www.cdb.com.cn/zwgk/", + "data_url": "https://www.cdb.com.cn", "api_url": null, "authority_level": "government", "country": "CN",