中国四级城市联动数据,包含港澳台,内含json , sql , python 脚本

python脚本:

复制代码
import json
from pypinyin import lazy_pinyin, Style

def get_pinyin(text):
    full = ''.join(lazy_pinyin(text, style=Style.TONE3))
    short = ''.join([p[0] for p in lazy_pinyin(text, style=Style.TONE3)])
    return full, short

def escape_sql(s):
    return s.replace("'", "''")

def main():
    with open('pcas-code.json', 'r', encoding='utf-8') as f:
        provinces = json.load(f)

    records = []
    id_counter = 1
    province_id_map = {}
    city_id_map = {}
    district_id_map = {}

    # === 构建所有记录(四级)===
    for province in provinces:
        p_code = province['code']
        p_name = province['name']
        pf, ps = get_pinyin(p_name)
        records.append({
            'id': id_counter,
            'name': p_name,
            'province': p_name,
            'code': p_code,
            'level': 1,
            'parent_id': 0,
            'pinyin': pf,
            'short_pinyin': ps
        })
        province_id_map[p_code] = id_counter
        id_counter += 1

        for city in province.get('children', []):
            c_code = city['code']
            c_name = city['name']
            cf, cs = get_pinyin(c_name)
            records.append({
                'id': id_counter,
                'name': c_name,
                'province': p_name,
                'code': c_code,
                'level': 2,
                'parent_id': province_id_map[p_code],
                'pinyin': cf,
                'short_pinyin': cs
            })
            city_id_map[c_code] = id_counter
            id_counter += 1

            for district in city.get('children', []):
                d_code = district['code']
                d_name = district['name']
                df, ds = get_pinyin(d_name)
                records.append({
                    'id': id_counter,
                    'name': d_name,
                    'province': p_name,
                    'code': d_code,
                    'level': 3,
                    'parent_id': city_id_map[c_code],
                    'pinyin': df,
                    'short_pinyin': ds
                })
                district_id_map[d_code] = id_counter
                id_counter += 1

                for town in district.get('children', []):
                    t_code = town['code']
                    t_name = town['name']
                    tf, ts = get_pinyin(t_name)
                    records.append({
                        'id': id_counter,
                        'name': t_name,
                        'province': p_name,
                        'code': t_code,
                        'level': 4,
                        'parent_id': district_id_map[d_code],
                        'pinyin': tf,
                        'short_pinyin': ts
                    })
                    id_counter += 1

    print(f"📊 共生成 {len(records)} 条记录(省+市+区县+乡镇)")

    # === 分批写入 SQL ===
    batch_size = 1000
    total_batches = (len(records) + batch_size - 1) // batch_size

    with open('insert_city_batch_1000.sql', 'w', encoding='utf-8') as f:
        f.write("-- 四级行政区划数据(省/市/区县/乡镇)\n")
        f.write("-- 每批 1000 条,自动分批插入\n")
        f.write("SET foreign_key_checks = 0;\n")
        f.write("SET sql_log_bin = 0; -- 可选:跳过 binlog(如需)\n\n")

        for i in range(0, len(records), batch_size):
            batch = records[i:i + batch_size]
            f.write("INSERT INTO `city` (`id`, `name`, `province`, `code`, `level`, `parent_id`, `pinyin`, `short_pinyin`, `sort`, `del_flag`, `create_time`, `update_time`) VALUES\n")
            lines = []
            for r in batch:
                parent_str = 'NULL' if r['parent_id'] is None else str(r['parent_id'])
                name = escape_sql(r['name'])
                province = escape_sql(r['province'])
                line = f"({r['id']}, '{name}', '{province}', '{r['code']}', {r['level']}, {parent_str}, '{r['pinyin']}', '{r['short_pinyin']}', 0, '0', NOW(), NOW())"
                lines.append(line)
            f.write(",\n".join(lines))
            f.write(";\n\n")

        f.write("SET foreign_key_checks = 1;\n")
        f.write("-- ✅ 导入完成\n")

    print(f"✅ 已生成 {total_batches} 个批次")
    print("📄 输出文件:insert_city_batch_1000.sql")

if __name__ == '__main__':
    main()
相关推荐
小郑加油10 分钟前
python学习Day11:认识与创建CSV文件
开发语言·python·学习
Pkmer12 分钟前
Java程序员大战Python面向对象
python·ai编程
小龙报18 分钟前
【Coze-AI智能体平台】低代码省时高效:Coze 应用开发全流程指南
java·人工智能·python·深度学习·低代码·chatgpt·交互
技术钱20 分钟前
LCEL表达式与Runnable可运行协议
python
Echo_NGC223723 分钟前
【论文解读】Attention Is All You Need —— AI 时代的“开山之作“,经典中的经典(transformer小白导读)
人工智能·python·深度学习·神经网络·机器学习·conda·transformer
鸟儿不吃草1 小时前
安卓实现左右布局聊天界面
android·开发语言·python
mr_LuoWei20091 小时前
类似CASS for autoCAD的平基土石方三维计算工具基本完成
python·三维地形图
alwaysrun1 小时前
Python自动提取邮件订阅链接并解析
python·url·邮件·ai提取
何中应1 小时前
Conda安装&使用
python·conda·python3.11