Files
MoFin/venv/lib/python3.12/site-packages/akshare/stock/stock_industry_cninfo.py
T
知微 fa45d8aa5f fix: 小果地址统一node122(兼容LAN+EasyTier)
- health_checklist.json: 192.168.1.122→node122
- ocr_client.py: docstring IP→node122
- docs/market-data-requirements.md: IP→node122
- 所有API调用通过ProxyHandler({})绕过系统代理
  Privoxy对node122:18003返回500,直连正常
2026-06-30 02:56:35 +08:00

184 lines
6.4 KiB
Python

# -*- coding:utf-8 -*-
# !/usr/bin/env python
"""
Date: 2024/5/19 18:34
Desc: 巨潮资讯-行业分类数据
https://webapi.cninfo.com.cn/#/apiDoc
https://webapi.cninfo.com.cn/api/stock/p_stock2110
"""
import numpy as np
import pandas as pd
import requests
import py_mini_racer
from akshare.datasets import get_ths_js
def _get_file_content_ths(file: str = "cninfo.js") -> str:
"""
获取 JS 文件的内容
:param file: JS 文件名
:type file: str
:return: 文件内容
:rtype: str
"""
setting_file_path = get_ths_js(file)
with open(setting_file_path, encoding="utf-8") as f:
file_data = f.read()
return file_data
def stock_industry_category_cninfo(symbol: str = "巨潮行业分类标准") -> pd.DataFrame:
"""
巨潮资讯-行业分类数据
https://webapi.cninfo.com.cn/#/apiDoc
查询 p_public0002 接口
:param symbol: 行业类型; choice of {"证监会行业分类标准", "巨潮行业分类标准", "申银万国行业分类标准",
"新财富行业分类标准", "国资委行业分类标准", "巨潮产业细分标准", "天相行业分类标准", "全球行业分类标准"}
:type symbol: str
:return: 行业分类数据
:rtype: pandas.DataFrame
"""
symbol_map = {
"证监会行业分类标准": "008001",
"巨潮行业分类标准": "008002",
"申银万国行业分类标准": "008003",
"新财富行业分类标准": "008004",
"国资委行业分类标准": "008005",
"巨潮产业细分标准": "008006",
"天相行业分类标准": "008007",
"全球行业分类标准": "008008",
}
url = "https://webapi.cninfo.com.cn/api/stock/p_public0002"
params = {"indcode": "", "indtype": symbol_map[symbol], "format": "json"}
js_code = py_mini_racer.MiniRacer()
js_content = _get_file_content_ths("cninfo.js")
js_code.eval(js_content)
mcode = js_code.call("getResCode1")
headers = {
"Accept": "*/*",
"Accept-Encoding": "gzip, deflate",
"Accept-Language": "zh-CN,zh;q=0.9,en;q=0.8",
"Cache-Control": "no-cache",
"Content-Length": "0",
"Host": "webapi.cninfo.com.cn",
"Accept-Enckey": mcode,
"Origin": "https://webapi.cninfo.com.cn",
"Pragma": "no-cache",
"Proxy-Connection": "keep-alive",
"Referer": "https://webapi.cninfo.com.cn/",
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) "
"Chrome/93.0.4577.63 Safari/537.36",
"X-Requested-With": "XMLHttpRequest",
}
r = requests.get(url, params=params, headers=headers)
data_json = r.json()
temp_df = pd.DataFrame(data_json["records"])
cols_map = {
"PARENTCODE": "父类编码",
"SORTCODE": "类目编码",
"SORTNAME": "类目名称",
"F001V": "类目名称英文",
"F002D": "终止日期",
"F003V": "行业类型编码",
"F004V": "行业类型",
}
temp_df.rename(columns=cols_map, inplace=True)
# 行业按分级排序
tmp = temp_df[["类目编码"]].copy()
tmp["len"] = temp_df["类目编码"].str.len()
tmp["Level"] = 0
g = tmp.groupby("len")
level = 0
for k in g.groups.keys():
temp_df.loc[temp_df["类目编码"].isin(g.get_group(k)["类目编码"]), "Level"] = (
level
)
level += 1
temp_df["Level"] = temp_df["Level"].astype(int)
temp_df.rename(columns={"Level": "分级"}, inplace=True)
temp_df["终止日期"] = pd.to_datetime(temp_df["终止日期"], errors="coerce").dt.date
return temp_df
def stock_industry_change_cninfo(
symbol: str = "002594",
start_date: str = "20091227",
end_date: str = "20220713",
) -> pd.DataFrame:
"""
巨潮资讯-上市公司行业归属的变动情况
https://webapi.cninfo.com.cn/#/apiDoc
查询 p_stock2110 接口
:param symbol: 股票代码
:type symbol: str
:param start_date: 开始变动日期
:type start_date: str
:param end_date: 结束变动日期
:type end_date: str
:return: 行业归属的变动情况
:rtype: pandas.DataFrame
"""
url = "https://webapi.cninfo.com.cn/api/stock/p_stock2110"
params = {
"scode": symbol,
"sdate": "-".join([start_date[:4], start_date[4:6], start_date[6:]]),
"edate": "-".join([end_date[:4], end_date[4:6], end_date[6:]]),
}
js_code = py_mini_racer.MiniRacer()
js_content = _get_file_content_ths("cninfo.js")
js_code.eval(js_content)
mcode = js_code.call("getResCode1")
headers = {
"Accept": "*/*",
"Accept-Encoding": "gzip, deflate",
"Accept-Language": "zh-CN,zh;q=0.9,en;q=0.8",
"Cache-Control": "no-cache",
"Content-Length": "0",
"Host": "webapi.cninfo.com.cn",
"Accept-Enckey": mcode,
"Origin": "https://webapi.cninfo.com.cn",
"Pragma": "no-cache",
"Proxy-Connection": "keep-alive",
"Referer": "https://webapi.cninfo.com.cn/",
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) "
"Chrome/93.0.4577.63 Safari/537.36",
"X-Requested-With": "XMLHttpRequest",
}
r = requests.post(url, params=params, headers=headers)
data_json = r.json()
temp_df = pd.DataFrame(data_json["records"])
cols_map = {
"ORGNAME": "机构名称",
"SECCODE": "证券代码",
"SECNAME": "新证券简称",
"VARYDATE": "变更日期",
"F001V": "分类标准编码",
"F002V": "分类标准",
"F003V": "行业编码",
"F004V": "行业门类",
"F005V": "行业次类",
"F006V": "行业大类",
"F007V": "行业中类",
"F008C": "最新记录标识",
}
ignore_cols = ["最新记录标识"]
temp_df.rename(columns=cols_map, inplace=True)
temp_df.fillna(np.nan, inplace=True)
temp_df["变更日期"] = pd.to_datetime(temp_df["变更日期"], errors="coerce").dt.date
data_df = temp_df[[c for c in temp_df.columns if c not in ignore_cols]]
return data_df
if __name__ == "__main__":
stock_industry_category_cninfo_df = stock_industry_category_cninfo(
symbol="巨潮行业分类标准"
)
print(stock_industry_category_cninfo_df)
stock_industry_change_cninfo_df = stock_industry_change_cninfo(
symbol="002594", start_date="20091227", end_date="20220708"
)
print(stock_industry_change_cninfo_df)