
Python: Fetch All of China's Provinces, Cities, Counties, Towns, and Villages
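The script below crawls the 2016 edition of the National Bureau of Statistics division-code pages level by level: provinces, prefecture-level cities, counties, towns, and villages. Each record is keyed by its statistical division code, and a parent's code is simply a prefix of its children's codes; that is what the slicing (id[0:4], id[0:6], id[0:9], id[0:12]) inside the functions relies on. A quick illustration of the nesting (the sample code value here is made up purely for demonstration):

# Hypothetical 12-digit village-level code, used only to show how the
# prefixes map onto the administrative levels handled by the script below.
code = '110101001001'
print(code[0:2])    # province / municipality  (2 digits)
print(code[0:4])    # prefecture-level city    (4 digits)
print(code[0:6])    # county / district        (6 digits)
print(code[0:9])    # town / street            (9 digits)
print(code[0:12])   # village / committee      (12 digits)

The full script: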

#!/usr/bin/python3
# -*- coding: utf-8 -*-
# author=He

"""
Build the full list of Chinese administrative divisions
from National Bureau of Statistics data
"""
import sys
import os
import re
from urllib import request
from bs4 import BeautifulSoup
sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
url = 'http://www.stats.gov.cn/tjsj/tjbz/tjyqhdmhcxhfdm/2016/'
header = {
    'Cookie': 'AD_RS_COOKIE=20080917',
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
                  'AppleWebKit/537.36 (KHTML, like Gecko) '
                  'Chrome/58.0.3029.110 Safari/537.36'
}


class GetHttp:
    """Small urllib wrapper that swallows request/decode errors."""

    def __init__(self, url, headers=None, charset='utf8'):
        if headers is None:
            headers = {}
        self._response = ''
        try:
            print(url)
            self._response = request.urlopen(request.Request(url=url, headers=headers))
        except Exception as e:
            print(e)
        self._c = charset

    @property
    def text(self):
        # Decoded page body, or '' if the request or the decoding failed
        try:
            return self._response.read().decode(self._c)
        except Exception as e:
            print(e)
            return ''


def provincetr(u, he, lists):
    # Provinces and municipalities (top level, 2-digit codes)
    t = GetHttp(u, he, 'gbk').text
    if t:
        soup = BeautifulSoup(t, 'html.parser')
        for i in soup.find_all(attrs={'class': 'provincetr'}):
            for a in i.find_all('a'):
                id = re.sub(r"\D", "", a.get('href'))
                lists[id] = {'id': id, 'name': a.text, 'pid': '0', 'pid1': '0',
                             'pid2': '0', 'pid3': '0', 'pid4': '0', 'code': id}
                # time.sleep(1 / 10)
    return lists


def citytr(u, he, lists):
    # Prefecture-level cities under each province (4-digit codes)
    l = lists.copy()
    for i in l:
        t = GetHttp(u + i + '.html', he, 'gbk').text
        if not t:
            continue
        soup = BeautifulSoup(t, 'html.parser')
        for v in soup.find_all(attrs={'class': 'citytr'}):
            id = str(v.find_all('td')[0].text)
            if id[0:4] not in lists.keys():
                lists[id[0:4]] = {'id': id[0:4], 'name': str(v.find_all('td')[1].text),
                                  'pid': '0', 'pid1': i, 'pid2': '0', 'pid3': '0',
                                  'pid4': '0', 'code': id}
    return lists


def countytr(u, he, lists):
    # Counties and districts under each city (6-digit codes)
    l = lists.copy()
    for i in l:
        t = GetHttp(u + i[0:2] + '/' + i + '.html', he, 'gbk').text
        if not t:
            continue
        soup = BeautifulSoup(t, 'html.parser')
        for v in soup.find_all(attrs={'class': 'countytr'}):
            id = str(v.find_all('td')[0].text)
            if id[0:6] not in lists.keys():
                lists[id[0:6]] = {'id': id[0:6], 'name': str(v.find_all('td')[1].text),
                                  'pid': '0', 'pid1': l[i]['pid1'], 'pid2': i,
                                  'pid3': '0', 'pid4': '0', 'code': id}
    return lists


def towntr(u, he, lists):
    # Towns and streets under each county (9-digit codes)
    l = lists.copy()
    for i in l:
        t = GetHttp(u + i[0:2] + '/' + i[2:4] + '/' + i + '.html', he, 'gbk').text
        if not t:
            continue
        soup = BeautifulSoup(t, 'html.parser')
        for v in soup.find_all(attrs={'class': 'towntr'}):
            id = str(v.find_all('td')[0].text)
            if id[0:9] not in lists.keys():
                lists[id[0:9]] = {'id': id[0:9], 'name': str(v.find_all('td')[1].text),
                                  'pid': '0', 'pid1': l[i]['pid1'], 'pid2': l[i]['pid2'],
                                  'pid3': i, 'pid4': '0', 'code': id}
    return lists


def villagetr(u, he, lists):
    # Villages and committees under each town (12-digit codes)
    l = lists.copy()
    for i in l:
        t = GetHttp(u + i[0:2] + '/' + i[2:4] + '/' + i[4:6] + '/' + i + '.html', he, 'gbk').text
        if not t:
            continue
        soup = BeautifulSoup(t, 'html.parser')
        for v in soup.find_all(attrs={'class': 'villagetr'}):
            id = str(v.find_all('td')[0].text)
            if id[0:12] not in lists.keys():
                lists[id[0:12]] = {'id': id[0:12], 'name': str(v.find_all('td')[1].text),
                                   'pid': '0', 'pid1': l[i]['pid1'], 'pid2': l[i]['pid2'],
                                   'pid3': l[i]['pid3'], 'pid4': i, 'code': id}
    return lists


p = provincetr(u=url, he=header, lists={})
print('省')   # provinces done
c = citytr(u=url, he=header, lists=p)
print('市')   # cities done
o = countytr(u=url, he=header, lists=c)
print('縣')   # counties done
t = towntr(u=url, he=header, lists=o)
print('鎮')   # towns done
v = villagetr(u=url, he=header, lists=t)
print('村')   # villages done
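
The crawl issues one HTTP request per page, so a full run takes a long time. It is therefore worth persisting the merged result instead of re-crawling. A minimal sketch, assuming the script above has completed and v holds the final dictionary; the filename regions.json is an arbitrary choice:

# Save the collected divisions to disk so the crawl does not have to be
# repeated (sketch only; regions.json is an arbitrary filename).
import json

with open('regions.json', 'w', encoding='utf8') as f:
    json.dump(v, f, ensure_ascii=False, indent=2)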