目录
2019年底,肺炎(COVID-19)在全球爆发,后来被确认为新型冠状病毒(SARS-CoV-2)所引发的。
我们在爬取到公开数据的条件下,开展了一些可视化工作希望能够帮助大家更好理解现在疫情的发展情况,更有信心一起战胜肆虐的病毒。
先去先找到今天要爬取的目标数据:
https://news.qq.com/zt2020/page/feiyan.htm#/


url='https://api.inews.qq.com/newsqa/v1/query/inner/publish/modules/list?modules=statisGradeCityDetail,diseaseh5Shelf'
通过爬虫获取它的json数据:
url='https://api.inews.qq.com/newsqa/v1/query/inner/publish/modules/list?modules=statisGradeCityDetail,diseaseh5Shelf'
response = requests.get(url, verify=False)
json_data = response.json()['data']
china_data = json_data['diseaseh5Shelf']['areaTree'][0]['children'] # 列表
通过一个for循环对我们的列表进行取值然后再存入到我们的字典中
data_set = []
for i in china_data:
?data_dict = {}
?# 地区名称
?data_dict['province'] = i['name']
?# 新增确认
?data_dict['nowConfirm'] = i['total']['nowConfirm']
?# 死亡人数
?data_dict['dead'] = i['total']['dead']
??? # 治愈人数
? data_dict['heal'] = i['total']['heal']
data_set.append(data_dict)
df = pd.DataFrame(data_set)
df.to_csv(‘yiqing_data.csv’)


df2 = df.sort_values(by=[‘nowConfirm’],ascending=False)[:9]
df2

bar = (
??? Bar()
??? .add_xaxis(list(df['province'].values)[:6])
??? .add_yaxis("死亡", df['dead'].values.tolist()[:6])
??? .add_yaxis("治愈", df['heal'].values.tolist()[:6])
??? .set_global_opts(
??????? title_opts=opts.TitleOpts(title="各地区确诊人数与死亡人数情况"),
??????? datazoom_opts=[opts.DataZoomOpts()],
??????? )
)
bar.render_notebook()

china_map = (
??? Map()
??? .add("现有确诊", [list(i) for i in zip(df['province'].values.tolist(),df['nowConfirm'].values.tolist())], "china")
??? .set_global_opts(
??????? title_opts=opts.TitleOpts(title="各地区确诊人数"),
??????? visualmap_opts=opts.VisualMapOpts(max_=600, is_piecewise=True),
??? )
)
china_map.render_notebook()

pie = (
??? Pie()
??? .add(
??????? "",
??????? [list(i) for i in zip(df2['province'].values.tolist(),df2['nowConfirm'].values.tolist())],
??????? radius = ["10%","30%"]
??? )
??? .set_global_opts(
??????????? legend_opts=opts.LegendOpts(orient="vertical", pos_top="70%", pos_left="70%"),
??? )
??? .set_series_opts(label_opts=opts.LabelOpts(formatter="{b}: {c}"))
)
pie.render_notebook()

line = (
??? Line()
??? .add_xaxis(list(df['province'].values))
??? .add_yaxis("治愈", df['heal'].values.tolist())
??? .add_yaxis("死亡", df['dead'].values.tolist())
??? .set_global_opts(
??????? title_opts=opts.TitleOpts(title="死亡与治愈"),
??? )
)
line.render_notebook()

import requests # 发送网络请求模块
import json
import pprint # 格式化输出模块
import pandas as pd # 数据分析当中一个非常重要的模块
from pyecharts import options as opts
from pyecharts.charts import Bar,Line,Pie,Map,Grid
import urllib3
from pyecharts.globals import CurrentConfig, NotebookType
# 配置对应的环境类型
CurrentConfig.NOTEBOOK_TYPE = NotebookType.JUPYTER_NOTEBOOK
CurrentConfig.ONLINE_HOST='https://assets.pyecharts.org/assets/'
urllib3.disable_warnings()#解决InsecureRequestWarning: Unverified HTTPS request is being made to host 'api.inews.qq.com'. 问题
url = 'https://api.inews.qq.com/newsqa/v1/query/inner/publish/modules/list?modules=statisGradeCityDetail,diseaseh5Shelf'
response = requests.get(url, verify=False)
json_data = response.json()['data']
china_data = json_data['diseaseh5Shelf']['areaTree'][0]['children'] # 列表
data_set = []
for i in china_data:
data_dict = {}
# 地区名称
data_dict['province'] = i['name']
# 新增确认
data_dict['nowConfirm'] = i['total']['nowConfirm']
# 死亡人数
data_dict['dead'] = i['total']['dead']
# 治愈人数
data_dict['heal'] = i['total']['heal']
data_set.append(data_dict)
df = pd.DataFrame(data_set)
df.to_csv('yiqing_data.csv')
df2 = df.sort_values(by=['nowConfirm'],ascending=False)[:9]
df2
# bar = (
# Bar()
# .add_xaxis(list(df['province'].values)[:6])
# .add_yaxis("死亡", df['dead'].values.tolist()[:6])
# .add_yaxis("治愈", df['heal'].values.tolist()[:6])
# .set_global_opts(
# title_opts=opts.TitleOpts(title="各地区确诊人数与死亡人数情况"),
# datazoom_opts=[opts.DataZoomOpts()],
# )
# )
# bar.render_notebook()
# china_map = (
# Map()
# .add("现有确诊", [list(i) for i in zip(df['province'].values.tolist(),df['nowConfirm'].values.tolist())], "china")
# .set_global_opts(
# title_opts=opts.TitleOpts(title="各地区确诊人数"),
# visualmap_opts=opts.VisualMapOpts(max_=600, is_piecewise=True),
# )
# )
# china_map.render_notebook()
# pie = (
# Pie()
# .add(
# "",
# [list(i) for i in zip(df2['province'].values.tolist(),df2['nowConfirm'].values.tolist())],
# radius = ["10%","30%"]
# )
# .set_global_opts(
# legend_opts=opts.LegendOpts(orient="vertical", pos_top="70%", pos_left="70%"),
# )
# .set_series_opts(label_opts=opts.LabelOpts(formatter="{b}: {c}"))
# )
# pie.render_notebook()
line = (
Line()
.add_xaxis(list(df['province'].values))
.add_yaxis("治愈", df['heal'].values.tolist())
.add_yaxis("死亡", df['dead'].values.tolist())
.set_global_opts(
title_opts=opts.TitleOpts(title="死亡与治愈"),
)
)
line.render_notebook()
先自我介绍一下,小编13年上师交大毕业,曾经在小公司待过,去过华为OPPO等大厂,18年进入阿里,直到现在。深知大多数初中级java工程师,想要升技能,往往是需要自己摸索成长或是报班学习,但对于培训机构动则近万元的学费,着实压力不小。自己不成体系的自学效率很低又漫长,而且容易碰到天花板技术停止不前。因此我收集了一份《java开发全套学习资料》送给大家,初衷也很简单,就是希望帮助到想自学又不知道该从何学起的朋友,同时减轻大家的负担。添加下方名片,即可获取全套学习资料哦