1. 程式人生 > 實用技巧 >STP生成樹實驗

STP生成樹實驗

更多python教程請到: 菜鳥教程www.piaodoo.com

人人影視www.sfkyty.com


Python實時資料採集-新型冠狀病毒

原始碼 來源:https://github.com/Programming-With-Love/2019-nCoV

疫情資料時間為:2020.2.1

專案相關截圖:

全國資料展示

國內資料展示

國外資料展示

檢視指定區域詳細資料

原始碼,注意安裝所需模組(例如 pip install 模組名)

import requests

import re

from bs4 import BeautifulSoup

from time import sleep

import json

from prettytable import ALL

from prettytable import PrettyTable

hubei = {}

guangdong = {}

zhejiang = {}

beijing = {}

shanghai = {}

hunan = {}

anhui = {}

chongqing = {}

sichuan = {}

shandong = {}

guangxi = {}

fujian = {}

jiangsu = {}

henan = {}

hainan = {}

tianjin = {}

jiangxi = {}

shanxi1 = {} # 陝西

guizhou = {}

liaoning = {}

xianggang = {}

heilongjiang = {}

aomen = {}

xinjiang = {}

gansu = {}

yunnan = {}

taiwan = {}

shanxi2 = {} # 山西

jilin = {}

hebei = {}

ningxia = {}

neimenggu = {}

qinghai = {} # none

xizang = {} # none

provinces_idx = [hubei, guangdong, zhejiang, chongqing, hunan, anhui, beijing,

     shanghai, henan, guangxi, shandong, jiangxi, jiangsu, sichuan,

     liaoning, fujian, heilongjiang, hainan, tianjin, hebei, shanxi2,

     yunnan, xianggang, shanxi1, guizhou, jilin, gansu, taiwan,

     xinjiang, ningxia, aomen, neimenggu, qinghai, xizang]

map = {

'湖北':0, '廣東':1, '浙江':2, '北京':3, '上海':4, '湖南':5, '安徽':6, '重慶':7,

'四川':8, '山東':9, '廣西':10, '福建':11, '江蘇':12, '河南':13, '海南':14,

'天津':15, '江西':16, '陝西':17, '貴州':18, '遼寧':19, '香港':20, '黑龍江':21,

'澳門':22, '新疆':23, '甘肅':24, '雲南':25, '臺灣':26, '山西':27, '吉林':28,

'河北':29, '寧夏':30, '內蒙古':31, '青海':32, '西藏':33

}

def getTime(text):

TitleTime = str(text)

TitleTime = re.findall('<span>(.*?)</span>', TitleTime)

return TitleTime[0]

def getAllCountry(text):

AllCountry = str(text)

AllCountry = AllCountry.replace("[<p class="confirmedNumber___3WrF5"><span class="content___2hIPS">", "")

AllCountry = AllCountry.replace("<span style="color: #4169e2">", "")

AllCountry = re.sub("</span>", "", AllCountry)

AllCountry = AllCountry.replace("</p>]", "")

AllCountry = AllCountry.replace("<span style="color: rgb(65, 105, 226);">", "")

AllCountry = re.sub("<span>", "", AllCountry)

AllCountry = re.sub("<p>", "", AllCountry)

AllCountry = re.sub("</p>", "", AllCountry)

return AllCountry

def query(province):

table = PrettyTable(['地區', '確診', '死亡', '治癒'])

for (k, v) in province.items():

name = k

table.add_row([name, v[0] if v[0] != 0 else '-', v[1] if v[1] != 0 else '-', v[2] if v[2] != 0 else '-'])

if len(province.keys()) != 0:

print(table)

else:

print("暫無")

def getInfo(text):

text = str(text)

text = re.sub("<p class="descText___Ui3tV">", "", text)

text = re.sub("</p>", "", text)

return text

def is_json(json_str):

try:

json.loads(json_str)

except ValueError:

return False

return True

def ff(str, num):

return str[:num] + str[num+1:]

def main():

url = "https://3g.dxy.cn/newh5/view/pneumonia"

try:

headers = {}

headers['user-agent'] = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/70.0.3538.77 Safari/537.36' #http頭大小寫不敏感

headers['accept'] = 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8'

headers['Connection'] = 'keep-alive'

headers['Upgrade-Insecure-Requests'] = '1'



r = requests.get(url, headers=headers)

r.raise_for_status()

r.encoding = r.apparent_encoding

soup = BeautifulSoup(r.text,'lxml')

table = PrettyTable(['地區', '確診', '死亡', '治癒'])

table.hrules = ALL



#### 截至時間

# TitleTime = getTime(soup.select('.title___2d1_B'))

 

print()

# print("       ",TitleTime + "\n")



while True:

  r = requests.get("https://service-f9fjwngp-1252021671.bj.apigw.tencentcs.com/release/pneumonia")

  json_str = json.loads(r.text)

  if json_str['error'] == 0:

    break



print("==================================全國資料==================================")

print()

 

print("   確診 " + str(json_str['data']['statistics']['confirmedCount']) + " 例"

  + "    " + "疑似 " + str(json_str['data']['statistics']['suspectedCount']) + " 例"

  + "    " + "死亡" + str(json_str['data']['statistics']['deadCount']) + " 例"

  + "    " + "治癒" + str(json_str['data']['statistics']['curedCount']) + " 例\n")



print("==================================相關情況==================================")

print()



print("傳染源:" + json_str['data']['statistics']['infectSource'])

print("病毒:" + json_str['data']['statistics']['virus'])

print("傳播途徑:" + json_str['data']['statistics']['passWay'])

print(json_str['data']['statistics']['remark1'])

print(json_str['data']['statistics']['remark2'] + "\n")

   

print("==================================國內情況==================================")

print()

 

json_provinces = re.findall("{\"provinceName\":(.*&#63;)]}", str(soup))



idx = 0

for province in json_provinces:

  if is_json(province):

    pass



  else:

    province = "{\"provinceName\":" + province + "]}"

    province = json.loads(province)

     

  province_name = province['provinceShortName'] if province['provinceShortName'] != 0 else '-'

  confirmed = province['confirmedCount'] if province['confirmedCount'] != 0 else '-'

  suspected = province['suspectedCount'] if province['suspectedCount'] != 0 else '-'

  cured = province['curedCount'] if province['curedCount'] != 0 else '-'

  dead = province['deadCount'] if province['deadCount'] != 0 else '-'

  table.add_row([province_name, confirmed, dead, cured])

  map[province_name] = idx

  idx = idx + 1

  for city in province['cities']:

    provinces_idx[map[province_name]][city['cityName']] = [city['confirmedCount'], city['deadCount'], city['curedCount']]



print(table)

 

 

print()

print("==================================國外情況==================================")

print()



json_provinces = str(re.findall("\"id\":949(.*&#63;)]}", str(soup)))

json_provinces = json_provinces[:1] + "{\"id\":949" + json_provinces[2:]

json_provinces = json_provinces[:len(json_provinces) - 2] + json_provinces[len(json_provinces) - 1:]

provinces = json.loads(json_provinces)



table = PrettyTable(['地區', '確診', '死亡', '治癒'])

for province in provinces:

  confirmed = province['confirmedCount'] if province['confirmedCount'] != 0 else '-'

  dead = province['deadCount'] if province['deadCount'] != 0 else '-'

  cured = province['curedCount'] if province['curedCount'] != 0 else '-'

  table.add_row([province['provinceName'], confirmed, dead, cured])

 

print(table)

print()

 

print("==================================最新訊息==================================")

print()

 

   

idx = 0

for news in json_str['data']['timeline']:

  if idx == 5:

    break

  print(news['pubDateStr'] + " " + news['title'])

  idx = idx + 1

 



print()

key = input("請輸入您想查詢詳細資訊的省份,例如 湖北\n")

print()

if key in map.keys():

  query(provinces_idx[map[key]])

else:

  print("暫無相關資訊")

   

print("\n歡迎提出各種意見")

except:

print("連線失敗")

if name == 'main':

main()

sleep(30)

以上就是Python實時資料採集-新型冠狀病毒的詳細內容,大家出門要做好安全措施,感謝對菜鳥教程www.piaodoo.com的支援。