1. 程式人生 > 程式設計 >Python實現實時資料採集新型冠狀病毒資料例項

Python實現實時資料採集新型冠狀病毒資料例項

Python實時資料採集-新型冠狀病毒

原始碼 來源:https://github.com/Programming-With-Love/2019-nCoV

疫情資料時間為:2020.2.1

Python實現實時資料採集新型冠狀病毒資料例項

專案相關截圖:

全國資料展示

Python實現實時資料採集新型冠狀病毒資料例項

國內資料展示

Python實現實時資料採集新型冠狀病毒資料例項

國外資料展示

Python實現實時資料採集新型冠狀病毒資料例項

檢視指定區域詳細資料

Python實現實時資料採集新型冠狀病毒資料例項

原始碼,注意安裝所需模組(例如 pip install 模組名)

import requests

import re

from bs4 import BeautifulSoup

from time import sleep

import json

from prettytable import ALL

from prettytable import PrettyTable

 

hubei = {}

guangdong = {}

zhejiang = {}

beijing = {}

shanghai = {}

hunan = {}

anhui = {}

chongqing = {}

sichuan = {}

shandong = {}

guangxi = {}

fujian = {}

jiangsu = {}

henan = {}

hainan = {}

tianjin = {}

jiangxi = {}

shanxi1 = {} # 陝西

guizhou = {}

liaoning = {}

xianggang = {}

heilongjiang = {}

aomen = {}

xinjiang = {}

gansu = {}

yunnan = {}

taiwan = {}

shanxi2 = {} # 山西

jilin = {}

hebei = {}

ningxia = {}

neimenggu = {}

qinghai = {} # none

xizang = {} # none

provinces_idx = [hubei,guangdong,zhejiang,chongqing,hunan,anhui,beijing,shanghai,henan,guangxi,shandong,jiangxi,jiangsu,sichuan,liaoning,fujian,heilongjiang,hainan,tianjin,hebei,shanxi2,yunnan,xianggang,shanxi1,guizhou,jilin,gansu,taiwan,xinjiang,ningxia,aomen,neimenggu,qinghai,xizang]

map = {

  '湖北':0,'廣東':1,'浙江':2,'北京':3,'上海':4,'湖南':5,'安徽':6,'重慶':7,'四川':8,'山東':9,'廣西':10,'福建':11,'江蘇':12,'河南':13,'海南':14,'天津':15,'江西':16,'陝西':17,'貴州':18,'遼寧':19,'香港':20,'黑龍江':21,'澳門':22,'新疆':23,'甘肅':24,'雲南':25,'臺灣':26,'山西':27,'吉林':28,'河北':29,'寧夏':30,'內蒙古':31,'青海':32,'西藏':33

}

 

 

def getTime(text):

  TitleTime = str(text)

  TitleTime = re.findall('<span>(.*?)</span>',TitleTime)

  return TitleTime[0]

 

def getAllCountry(text):

  AllCountry = str(text)

  AllCountry = AllCountry.replace("[<p class=\"confirmedNumber___3WrF5\"><span class=\"content___2hIPS\">","")

  AllCountry = AllCountry.replace("<span style=\"color: #4169e2\">","")

  AllCountry = re.sub("</span>","",AllCountry)

  AllCountry = AllCountry.replace("</p>]","")

   

  AllCountry = AllCountry.replace("<span style=\"color: rgb(65,105,226);\">","")

  AllCountry = re.sub("<span>",AllCountry)

  AllCountry = re.sub("<p>",AllCountry)

  AllCountry = re.sub("</p>",AllCountry)

  return AllCountry 

 

def query(province):

  table = PrettyTable(['地區','確診','死亡','治癒'])

 

  for (k,v) in province.items():

    name = k

    table.add_row([name,v[0] if v[0] != 0 else '-',v[1] if v[1] != 0 else '-',v[2] if v[2] != 0 else '-'])

  if len(province.keys()) != 0:

    print(table)

  else:

    print("暫無")

 

def getInfo(text):

  text = str(text)

  text = re.sub("<p class=\"descText___Ui3tV\">",text)

  text = re.sub("</p>",text)

  return text

 

def is_json(json_str):

  try:

    json.loads(json_str)

  except ValueError:

    return False

  return True

 

def ff(str,num):

  return str[:num] + str[num+1:]

     

 

def main():

  url = "https://3g.dxy.cn/newh5/view/pneumonia"

 

  try:

    headers = {}

    headers['user-agent'] = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML,like Gecko) Chrome/70.0.3538.77 Safari/537.36' #http頭大小寫不敏感

    headers['accept'] = 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8'

    headers['Connection'] = 'keep-alive'

    headers['Upgrade-Insecure-Requests'] = '1'

 

    r = requests.get(url,headers=headers)

    r.raise_for_status()

    r.encoding = r.apparent_encoding

    soup = BeautifulSoup(r.text,'lxml')

    table = PrettyTable(['地區','治癒'])

    table.hrules = ALL

 

    #### 截至時間

    # TitleTime = getTime(soup.select('.title___2d1_B'))

     

    print()

    # print("       ",TitleTime + "\n")

 

    while True:

      r = requests.get("https://service-f9fjwngp-1252021671.bj.apigw.tencentcs.com/release/pneumonia")

      json_str = json.loads(r.text)

      if json_str['error'] == 0:

        break

 

    print("==================================全國資料==================================")

    print()

     

    print("   確診 " + str(json_str['data']['statistics']['confirmedCount']) + " 例"

      + "    " + "疑似 " + str(json_str['data']['statistics']['suspectedCount']) + " 例"

      + "    " + "死亡" + str(json_str['data']['statistics']['deadCount']) + " 例"

      + "    " + "治癒" + str(json_str['data']['statistics']['curedCount']) + " 例\n")

 

    print("==================================相關情況==================================")

    print()

 

    print("傳染源:" + json_str['data']['statistics']['infectSource'])

    print("病毒:" + json_str['data']['statistics']['virus'])

    print("傳播途徑:" + json_str['data']['statistics']['passWay'])

    print(json_str['data']['statistics']['remark1'])

    print(json_str['data']['statistics']['remark2'] + "\n")

       

    print("==================================國內情況==================================")

    print()

     

    json_provinces = re.findall("{\"provinceName\":(.*?)]}",str(soup))

 

    idx = 0

    for province in json_provinces:

      if is_json(province):

        pass

 

      else:

        province = "{\"provinceName\":" + province + "]}"

        province = json.loads(province)

         

      province_name = province['provinceShortName'] if province['provinceShortName'] != 0 else '-'

      confirmed = province['confirmedCount'] if province['confirmedCount'] != 0 else '-'

      suspected = province['suspectedCount'] if province['suspectedCount'] != 0 else '-'

      cured = province['curedCount'] if province['curedCount'] != 0 else '-'

      dead = province['deadCount'] if province['deadCount'] != 0 else '-'

      table.add_row([province_name,confirmed,dead,cured])

      map[province_name] = idx

      idx = idx + 1

      for city in province['cities']:

        provinces_idx[map[province_name]][city['cityName']] = [city['confirmedCount'],city['deadCount'],city['curedCount']]

 

    print(table)

     

     

    print()

    print("==================================國外情況==================================")

    print()

 

    json_provinces = str(re.findall("\"id\":949(.*?)]}",str(soup)))

    json_provinces = json_provinces[:1] + "{\"id\":949" + json_provinces[2:]

    json_provinces = json_provinces[:len(json_provinces) - 2] + json_provinces[len(json_provinces) - 1:]

    provinces = json.loads(json_provinces)

 

    table = PrettyTable(['地區','治癒'])

    for province in provinces:

      confirmed = province['confirmedCount'] if province['confirmedCount'] != 0 else '-'

      dead = province['deadCount'] if province['deadCount'] != 0 else '-'

      cured = province['curedCount'] if province['curedCount'] != 0 else '-'

      table.add_row([province['provinceName'],cured])

     

    print(table)

    print()

     

    print("==================================最新訊息==================================")

    print()

     

       

    idx = 0

    for news in json_str['data']['timeline']:

      if idx == 5:

        break

      print(news['pubDateStr'] + " " + news['title'])

      idx = idx + 1

     

 

    print()

    key = input("請輸入您想查詢詳細資訊的省份,例如 湖北\n")

    print()

    if key in map.keys():

      query(provinces_idx[map[key]])

    else:

      print("暫無相關資訊")

       

    print("\n歡迎提出各種意見")

  except:

    print("連線失敗")

 

if __name__ == '__main__':

  main()

  sleep(30)

以上就是Python實時資料採集-新型冠狀病毒的詳細內容,大家出門要做好安全措施,感謝對我們的支援。