中国四级城市联动数据,包含港澳台,内含json , sql , python 脚本

python脚本:

复制代码
import json
from pypinyin import lazy_pinyin, Style

def get_pinyin(text):
    full = ''.join(lazy_pinyin(text, style=Style.TONE3))
    short = ''.join([p[0] for p in lazy_pinyin(text, style=Style.TONE3)])
    return full, short

def escape_sql(s):
    return s.replace("'", "''")

def main():
    with open('pcas-code.json', 'r', encoding='utf-8') as f:
        provinces = json.load(f)

    records = []
    id_counter = 1
    province_id_map = {}
    city_id_map = {}
    district_id_map = {}

    # === 构建所有记录(四级)===
    for province in provinces:
        p_code = province['code']
        p_name = province['name']
        pf, ps = get_pinyin(p_name)
        records.append({
            'id': id_counter,
            'name': p_name,
            'province': p_name,
            'code': p_code,
            'level': 1,
            'parent_id': 0,
            'pinyin': pf,
            'short_pinyin': ps
        })
        province_id_map[p_code] = id_counter
        id_counter += 1

        for city in province.get('children', []):
            c_code = city['code']
            c_name = city['name']
            cf, cs = get_pinyin(c_name)
            records.append({
                'id': id_counter,
                'name': c_name,
                'province': p_name,
                'code': c_code,
                'level': 2,
                'parent_id': province_id_map[p_code],
                'pinyin': cf,
                'short_pinyin': cs
            })
            city_id_map[c_code] = id_counter
            id_counter += 1

            for district in city.get('children', []):
                d_code = district['code']
                d_name = district['name']
                df, ds = get_pinyin(d_name)
                records.append({
                    'id': id_counter,
                    'name': d_name,
                    'province': p_name,
                    'code': d_code,
                    'level': 3,
                    'parent_id': city_id_map[c_code],
                    'pinyin': df,
                    'short_pinyin': ds
                })
                district_id_map[d_code] = id_counter
                id_counter += 1

                for town in district.get('children', []):
                    t_code = town['code']
                    t_name = town['name']
                    tf, ts = get_pinyin(t_name)
                    records.append({
                        'id': id_counter,
                        'name': t_name,
                        'province': p_name,
                        'code': t_code,
                        'level': 4,
                        'parent_id': district_id_map[d_code],
                        'pinyin': tf,
                        'short_pinyin': ts
                    })
                    id_counter += 1

    print(f"📊 共生成 {len(records)} 条记录(省+市+区县+乡镇)")

    # === 分批写入 SQL ===
    batch_size = 1000
    total_batches = (len(records) + batch_size - 1) // batch_size

    with open('insert_city_batch_1000.sql', 'w', encoding='utf-8') as f:
        f.write("-- 四级行政区划数据(省/市/区县/乡镇)\n")
        f.write("-- 每批 1000 条,自动分批插入\n")
        f.write("SET foreign_key_checks = 0;\n")
        f.write("SET sql_log_bin = 0; -- 可选:跳过 binlog(如需)\n\n")

        for i in range(0, len(records), batch_size):
            batch = records[i:i + batch_size]
            f.write("INSERT INTO `city` (`id`, `name`, `province`, `code`, `level`, `parent_id`, `pinyin`, `short_pinyin`, `sort`, `del_flag`, `create_time`, `update_time`) VALUES\n")
            lines = []
            for r in batch:
                parent_str = 'NULL' if r['parent_id'] is None else str(r['parent_id'])
                name = escape_sql(r['name'])
                province = escape_sql(r['province'])
                line = f"({r['id']}, '{name}', '{province}', '{r['code']}', {r['level']}, {parent_str}, '{r['pinyin']}', '{r['short_pinyin']}', 0, '0', NOW(), NOW())"
                lines.append(line)
            f.write(",\n".join(lines))
            f.write(";\n\n")

        f.write("SET foreign_key_checks = 1;\n")
        f.write("-- ✅ 导入完成\n")

    print(f"✅ 已生成 {total_batches} 个批次")
    print("📄 输出文件:insert_city_batch_1000.sql")

if __name__ == '__main__':
    main()
相关推荐
BoBoZz192 小时前
Curvatures 曲率的计算、边缘曲率的调整以及曲率、颜色的映射
python·vtk·图形渲染·图形处理
思成不止于此2 小时前
【MySQL 零基础入门】MySQL 约束精讲(一):基础约束篇
数据库·笔记·sql·学习·mysql
少吃零食多运动2 小时前
【Jupyter notebook修改工作目录】
python·jupyter
Swizard2 小时前
别买树莓派了!3步教你在安卓手机上跑通 CPython + PaddleOCR,打造随身 AI 识别终端
python·ai·移动开发
ActionTech3 小时前
SCALE | SQLFlash 在 SQL 优化维度上的表现评估
数据库·sql
weixin_421585013 小时前
PYTHON 迭代器1 - PEP-255
开发语言·python
hxxjxw4 小时前
Pytorch分布式训练/多卡训练(六) —— Expert Parallelism (MoE的特殊策略)
人工智能·pytorch·python
dagouaofei4 小时前
PPT AI生成实测报告:哪些工具值得长期使用?
人工智能·python·powerpoint