中国四级城市联动数据,包含港澳台,内含json , sql , python 脚本

python脚本:

复制代码
import json
from pypinyin import lazy_pinyin, Style

def get_pinyin(text):
    full = ''.join(lazy_pinyin(text, style=Style.TONE3))
    short = ''.join([p[0] for p in lazy_pinyin(text, style=Style.TONE3)])
    return full, short

def escape_sql(s):
    return s.replace("'", "''")

def main():
    with open('pcas-code.json', 'r', encoding='utf-8') as f:
        provinces = json.load(f)

    records = []
    id_counter = 1
    province_id_map = {}
    city_id_map = {}
    district_id_map = {}

    # === 构建所有记录(四级)===
    for province in provinces:
        p_code = province['code']
        p_name = province['name']
        pf, ps = get_pinyin(p_name)
        records.append({
            'id': id_counter,
            'name': p_name,
            'province': p_name,
            'code': p_code,
            'level': 1,
            'parent_id': 0,
            'pinyin': pf,
            'short_pinyin': ps
        })
        province_id_map[p_code] = id_counter
        id_counter += 1

        for city in province.get('children', []):
            c_code = city['code']
            c_name = city['name']
            cf, cs = get_pinyin(c_name)
            records.append({
                'id': id_counter,
                'name': c_name,
                'province': p_name,
                'code': c_code,
                'level': 2,
                'parent_id': province_id_map[p_code],
                'pinyin': cf,
                'short_pinyin': cs
            })
            city_id_map[c_code] = id_counter
            id_counter += 1

            for district in city.get('children', []):
                d_code = district['code']
                d_name = district['name']
                df, ds = get_pinyin(d_name)
                records.append({
                    'id': id_counter,
                    'name': d_name,
                    'province': p_name,
                    'code': d_code,
                    'level': 3,
                    'parent_id': city_id_map[c_code],
                    'pinyin': df,
                    'short_pinyin': ds
                })
                district_id_map[d_code] = id_counter
                id_counter += 1

                for town in district.get('children', []):
                    t_code = town['code']
                    t_name = town['name']
                    tf, ts = get_pinyin(t_name)
                    records.append({
                        'id': id_counter,
                        'name': t_name,
                        'province': p_name,
                        'code': t_code,
                        'level': 4,
                        'parent_id': district_id_map[d_code],
                        'pinyin': tf,
                        'short_pinyin': ts
                    })
                    id_counter += 1

    print(f"📊 共生成 {len(records)} 条记录(省+市+区县+乡镇)")

    # === 分批写入 SQL ===
    batch_size = 1000
    total_batches = (len(records) + batch_size - 1) // batch_size

    with open('insert_city_batch_1000.sql', 'w', encoding='utf-8') as f:
        f.write("-- 四级行政区划数据(省/市/区县/乡镇)\n")
        f.write("-- 每批 1000 条,自动分批插入\n")
        f.write("SET foreign_key_checks = 0;\n")
        f.write("SET sql_log_bin = 0; -- 可选:跳过 binlog(如需)\n\n")

        for i in range(0, len(records), batch_size):
            batch = records[i:i + batch_size]
            f.write("INSERT INTO `city` (`id`, `name`, `province`, `code`, `level`, `parent_id`, `pinyin`, `short_pinyin`, `sort`, `del_flag`, `create_time`, `update_time`) VALUES\n")
            lines = []
            for r in batch:
                parent_str = 'NULL' if r['parent_id'] is None else str(r['parent_id'])
                name = escape_sql(r['name'])
                province = escape_sql(r['province'])
                line = f"({r['id']}, '{name}', '{province}', '{r['code']}', {r['level']}, {parent_str}, '{r['pinyin']}', '{r['short_pinyin']}', 0, '0', NOW(), NOW())"
                lines.append(line)
            f.write(",\n".join(lines))
            f.write(";\n\n")

        f.write("SET foreign_key_checks = 1;\n")
        f.write("-- ✅ 导入完成\n")

    print(f"✅ 已生成 {total_batches} 个批次")
    print("📄 输出文件:insert_city_batch_1000.sql")

if __name__ == '__main__':
    main()
相关推荐
2501_945423541 小时前
用Matplotlib绘制专业图表:从基础到高级
jvm·数据库·python
2301_793804691 小时前
使用Python处理计算机图形学(PIL/Pillow)
jvm·数据库·python
qqxhb7 小时前
11|结构化输出:为什么 JSON 能让系统更稳定
json·ai编程·结构化·规范模板
吴佳浩7 小时前
GPU 编号进阶:CUDA\_VISIBLE\_DEVICES、多进程与容器化陷阱
人工智能·pytorch·python
全栈凯哥8 小时前
18.Python中的导入类完全指南
python
sunwenjian8868 小时前
Java进阶——IO 流
java·开发语言·python
guts3509 小时前
图像篡改数据集下载:COVERAGE、CASIA
python·数据集
森林猿9 小时前
java-modbus-读取-modbus4j
java·网络·python
2401_879693879 小时前
将Python Web应用部署到服务器(Docker + Nginx)
jvm·数据库·python
reembarkation9 小时前
光标在a-select,鼠标已经移出,下拉框跟随页面滚动
java·数据库·sql