Files
MoFin/venv/lib/python3.12/site-packages/akshare/event/migration.py
T
知微 fa45d8aa5f fix: 小果地址统一node122(兼容LAN+EasyTier)
- health_checklist.json: 192.168.1.122→node122
- ocr_client.py: docstring IP→node122
- docs/market-data-requirements.md: IP→node122
- 所有API调用通过ProxyHandler({})绕过系统代理
  Privoxy对node122:18003返回500,直连正常
2026-06-30 02:56:35 +08:00

105 lines
3.7 KiB
Python

#!/usr/bin/env python
# -*- coding:utf-8 -*-
"""
Date: 2024/5/12 22:30
Desc: 百度地图慧眼-百度迁徙数据
"""
import json
import pandas as pd
import requests
from akshare.event.cons import province_dict, city_dict
def migration_area_baidu(
area: str = "重庆市", indicator: str = "move_in", date: str = "20230922"
) -> pd.DataFrame:
"""
百度地图慧眼-百度迁徙-XXX迁入地详情
百度地图慧眼-百度迁徙-XXX迁出地详情
以上展示 top100 结果,如不够 100 则展示全部
迁入来源地比例: 从 xx 地迁入到当前区域的人数与当前区域迁入总人口的比值
迁出目的地比例: 从当前区域迁出到 xx 的人口与从当前区域迁出总人口的比值
https://qianxi.baidu.com/?from=shoubai#city=0
:param area: 可以输入 省份 或者 具体城市 但是需要用全称
:type area: str
:param indicator: move_in 迁入 move_out 迁出
:type indicator: str
:param date: 查询的日期 20200101 以后的时间
:type date: str
:return: 迁入地详情/迁出地详情的前 50 个
:rtype: pandas.DataFrame
"""
city_dict.update(province_dict)
inner_dict = dict(zip(city_dict.values(), city_dict.keys()))
if inner_dict[area] in province_dict.keys():
dt_flag = "province"
else:
dt_flag = "city"
url = "https://huiyan.baidu.com/migration/cityrank.jsonp"
params = {
"dt": dt_flag,
"id": inner_dict[area],
"type": indicator,
"date": date,
}
r = requests.get(url, params=params)
data_text = r.text[r.text.find("({") + 1 : r.text.rfind(");")]
data_json = json.loads(data_text)
temp_df = pd.DataFrame(data_json["data"]["list"])
temp_df["value"] = pd.to_numeric(temp_df["value"], errors="coerce")
return temp_df
def migration_scale_baidu(
area: str = "广州市",
indicator: str = "move_in",
) -> pd.DataFrame:
"""
百度地图慧眼-百度迁徙-迁徙规模
迁徙规模指数:反映迁入或迁出人口规模,城市间可横向对比城市迁徙边界采用该城市行政区划,包含该城市管辖的区、县、乡、村
https://qianxi.baidu.com/?from=shoubai#city=0
:param area: 可以输入 省份 或者 具体城市 但是需要用全称
:type area: str
:param indicator: move_in 迁入 move_out 迁出
:type indicator: str
:return: 时间序列的迁徙规模指数
:rtype: pandas.DataFrame
"""
city_dict.update(province_dict)
inner_dict = dict(zip(city_dict.values(), city_dict.keys()))
if inner_dict[area] in province_dict.keys():
dt_flag = "province"
else:
dt_flag = "city"
url = "https://huiyan.baidu.com/migration/historycurve.jsonp"
params = {
"dt": dt_flag,
"id": inner_dict[area],
"type": indicator,
}
r = requests.get(url, params=params)
json_data = json.loads(r.text[r.text.find("({") + 1 : r.text.rfind(");")])
temp_df = pd.DataFrame.from_dict(json_data["data"]["list"], orient="index")
temp_df.index = pd.to_datetime(temp_df.index)
temp_df.reset_index(inplace=True)
temp_df.columns = ["日期", "迁徙规模指数"]
temp_df["日期"] = pd.to_datetime(temp_df["日期"], errors="coerce").dt.date
temp_df["迁徙规模指数"] = pd.to_numeric(temp_df["迁徙规模指数"], errors="coerce")
return temp_df
if __name__ == "__main__":
migration_area_baidu_df = migration_area_baidu(
area="杭州市", indicator="move_out", date="20240401"
)
print(migration_area_baidu_df)
migration_scale_baidu_df = migration_scale_baidu(
area="广州市",
indicator="move_in",
)
print(migration_scale_baidu_df)