Python實現實時資料採集新型冠狀病毒資料例項
阿新 • • 發佈:2020-02-05
Python實時資料採集-新型冠狀病毒
原始碼 來源:https://github.com/Programming-With-Love/2019-nCoV
疫情資料時間為:2020.2.1
專案相關截圖:
全國資料展示
國內資料展示
國外資料展示
檢視指定區域詳細資料
原始碼,注意安裝所需模組(例如 pip install 模組名)
import requests import re from bs4 import BeautifulSoup from time import sleep import json from prettytable import ALL from prettytable import PrettyTable hubei = {} guangdong = {} zhejiang = {} beijing = {} shanghai = {} hunan = {} anhui = {} chongqing = {} sichuan = {} shandong = {} guangxi = {} fujian = {} jiangsu = {} henan = {} hainan = {} tianjin = {} jiangxi = {} shanxi1 = {} # 陝西 guizhou = {} liaoning = {} xianggang = {} heilongjiang = {} aomen = {} xinjiang = {} gansu = {} yunnan = {} taiwan = {} shanxi2 = {} # 山西 jilin = {} hebei = {} ningxia = {} neimenggu = {} qinghai = {} # none xizang = {} # none provinces_idx = [hubei,guangdong,zhejiang,chongqing,hunan,anhui,beijing,shanghai,henan,guangxi,shandong,jiangxi,jiangsu,sichuan,liaoning,fujian,heilongjiang,hainan,tianjin,hebei,shanxi2,yunnan,xianggang,shanxi1,guizhou,jilin,gansu,taiwan,xinjiang,ningxia,aomen,neimenggu,qinghai,xizang] map = { '湖北':0,'廣東':1,'浙江':2,'北京':3,'上海':4,'湖南':5,'安徽':6,'重慶':7,'四川':8,'山東':9,'廣西':10,'福建':11,'江蘇':12,'河南':13,'海南':14,'天津':15,'江西':16,'陝西':17,'貴州':18,'遼寧':19,'香港':20,'黑龍江':21,'澳門':22,'新疆':23,'甘肅':24,'雲南':25,'臺灣':26,'山西':27,'吉林':28,'河北':29,'寧夏':30,'內蒙古':31,'青海':32,'西藏':33 } def getTime(text): TitleTime = str(text) TitleTime = re.findall('<span>(.*?)</span>',TitleTime) return TitleTime[0] def getAllCountry(text): AllCountry = str(text) AllCountry = AllCountry.replace("[<p class=\"confirmedNumber___3WrF5\"><span class=\"content___2hIPS\">","") AllCountry = AllCountry.replace("<span style=\"color: #4169e2\">","") AllCountry = re.sub("</span>","",AllCountry) AllCountry = AllCountry.replace("</p>]","") AllCountry = AllCountry.replace("<span style=\"color: rgb(65,105,226);\">","") AllCountry = re.sub("<span>",AllCountry) AllCountry = re.sub("<p>",AllCountry) AllCountry = re.sub("</p>",AllCountry) return AllCountry def query(province): table = PrettyTable(['地區','確診','死亡','治癒']) for (k,v) in province.items(): name = k table.add_row([name,v[0] if v[0] != 0 else '-',v[1] if v[1] != 0 else '-',v[2] if v[2] != 0 else '-']) if len(province.keys()) != 0: print(table) else: print("暫無") def getInfo(text): text = str(text) text = re.sub("<p class=\"descText___Ui3tV\">",text) text = re.sub("</p>",text) return text def is_json(json_str): try: json.loads(json_str) except ValueError: return False return True def ff(str,num): return str[:num] + str[num+1:] def main(): url = "https://3g.dxy.cn/newh5/view/pneumonia" try: headers = {} headers['user-agent'] = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML,like Gecko) Chrome/70.0.3538.77 Safari/537.36' #http頭大小寫不敏感 headers['accept'] = 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8' headers['Connection'] = 'keep-alive' headers['Upgrade-Insecure-Requests'] = '1' r = requests.get(url,headers=headers) r.raise_for_status() r.encoding = r.apparent_encoding soup = BeautifulSoup(r.text,'lxml') table = PrettyTable(['地區','治癒']) table.hrules = ALL #### 截至時間 # TitleTime = getTime(soup.select('.title___2d1_B')) print() # print(" ",TitleTime + "\n") while True: r = requests.get("https://service-f9fjwngp-1252021671.bj.apigw.tencentcs.com/release/pneumonia") json_str = json.loads(r.text) if json_str['error'] == 0: break print("==================================全國資料==================================") print() print(" 確診 " + str(json_str['data']['statistics']['confirmedCount']) + " 例" + " " + "疑似 " + str(json_str['data']['statistics']['suspectedCount']) + " 例" + " " + "死亡" + str(json_str['data']['statistics']['deadCount']) + " 例" + " " + "治癒" + str(json_str['data']['statistics']['curedCount']) + " 例\n") print("==================================相關情況==================================") print() print("傳染源:" + json_str['data']['statistics']['infectSource']) print("病毒:" + json_str['data']['statistics']['virus']) print("傳播途徑:" + json_str['data']['statistics']['passWay']) print(json_str['data']['statistics']['remark1']) print(json_str['data']['statistics']['remark2'] + "\n") print("==================================國內情況==================================") print() json_provinces = re.findall("{\"provinceName\":(.*?)]}",str(soup)) idx = 0 for province in json_provinces: if is_json(province): pass else: province = "{\"provinceName\":" + province + "]}" province = json.loads(province) province_name = province['provinceShortName'] if province['provinceShortName'] != 0 else '-' confirmed = province['confirmedCount'] if province['confirmedCount'] != 0 else '-' suspected = province['suspectedCount'] if province['suspectedCount'] != 0 else '-' cured = province['curedCount'] if province['curedCount'] != 0 else '-' dead = province['deadCount'] if province['deadCount'] != 0 else '-' table.add_row([province_name,confirmed,dead,cured]) map[province_name] = idx idx = idx + 1 for city in province['cities']: provinces_idx[map[province_name]][city['cityName']] = [city['confirmedCount'],city['deadCount'],city['curedCount']] print(table) print() print("==================================國外情況==================================") print() json_provinces = str(re.findall("\"id\":949(.*?)]}",str(soup))) json_provinces = json_provinces[:1] + "{\"id\":949" + json_provinces[2:] json_provinces = json_provinces[:len(json_provinces) - 2] + json_provinces[len(json_provinces) - 1:] provinces = json.loads(json_provinces) table = PrettyTable(['地區','治癒']) for province in provinces: confirmed = province['confirmedCount'] if province['confirmedCount'] != 0 else '-' dead = province['deadCount'] if province['deadCount'] != 0 else '-' cured = province['curedCount'] if province['curedCount'] != 0 else '-' table.add_row([province['provinceName'],cured]) print(table) print() print("==================================最新訊息==================================") print() idx = 0 for news in json_str['data']['timeline']: if idx == 5: break print(news['pubDateStr'] + " " + news['title']) idx = idx + 1 print() key = input("請輸入您想查詢詳細資訊的省份,例如 湖北\n") print() if key in map.keys(): query(provinces_idx[map[key]]) else: print("暫無相關資訊") print("\n歡迎提出各種意見") except: print("連線失敗") if __name__ == '__main__': main() sleep(30)
以上就是Python實時資料採集-新型冠狀病毒的詳細內容,大家出門要做好安全措施,感謝對我們的支援。