【原】用Matplotlib畫兩張花里胡哨的圖

小小明代碼實體 2021-11-30

展開全文

作者：小小明

今天要畫兩張圖，分別是：

png

代碼邏輯較為復雜，這次只展示代碼。

導包

import matplotlib.pyplot as plt
import matplotlib as mpl
import numpy as np
import pandas as pd
# 解決中文顯示問題
mpl.rcParams['font.sans-serif'] = ['SimHei']
mpl.rcParams['axes.unicode_minus'] = False

數(shù)據讀取

excel = pd.ExcelFile("旅游數(shù)據.xlsx")
df_2019 = pd.read_excel(excel, sheet_name=0)
df_2020 = pd.read_excel(excel, sheet_name=1)
df_2019["年份"] = 2019
df_2020["年份"] = 2020
display(df_2019.head())
df_2020['指標名稱'].replace('兵團', '新疆兵團', inplace=True)
df_2020.tail()

	指標名稱	代碼	本季組織人次數(shù)	本季接待人次數(shù)	本季組織人天數(shù)	本季接待人天數(shù)	年份
0	北京	1	1229139	811223	4841564	3654045	2019
1	天津	2	1108300	411033	2989315	1057598	2019
2	河北	3	813446	343793	1991293	750916	2019
3	山西	4	587867	555379	2066682	2218679	2019
4	內蒙古	5	115648	186861	461579	640426	2019

	指標名稱	代碼	本季組織人次數(shù)	本季接待人次數(shù)	本季組織人天數(shù)	本季接待人天數(shù)	年份
27	甘肅	28	83076	27911	133133	64421	2020
28	青海	29	55968	33627	65130	52868	2020
29	寧夏	30	47134	23854	78404	35521	2020
30	新疆	31	38474	20079	74410	33474	2020
31	新疆兵團	32	25759	18005	49957	39839	2020

第一張圖

plt.style.use('fivethirtyeight')
plt.figure(figsize=(20, 14))
plt.subplot(2, 1, 1)
plt.title("2019與2020年本季組織人次數(shù)前十的對比", fontsize=20)
t1 = (df_2019[["指標名稱", "本季組織人次數(shù)"]]
      .sort_values("本季組織人次數(shù)", ascending=False)
      .head(10)
      )
t2 = (df_2020[["指標名稱", "本季組織人次數(shù)"]]
      .sort_values("本季組織人次數(shù)", ascending=False)
      .head(10)
      )
plt.plot(range(10), t1['本季組織人次數(shù)'], linewidth=2,
         label='2019', marker='o', markersize=8)
plt.plot(range(10), t2['本季組織人次數(shù)'], linewidth=2,
         label='2020', marker='s', markersize=8)
plt.fill_between(range(10), t1['本季組織人次數(shù)'], t2['本季組織人次數(shù)'],
                 color="gray", alpha=0.2, label="area")
plt.legend(['2019', '2020'], fontsize=20)
plt.grid(b=True)
for x, (city, y) in enumerate(t1[["指標名稱", "本季組織人次數(shù)"]].values):
    plt.text(x, y, f"{city}:\n{y/10000:.2f}萬", fontsize=15,
             horizontalalignment='center', verticalalignment='center')
for x, (city, y) in enumerate(t2[["指標名稱", "本季組織人次數(shù)"]].values):
    plt.text(x, y, f"{city}:\n{y/10000:.2f}萬", fontsize=15,
             horizontalalignment='center', verticalalignment='center')
plt.xticks(range(10), [f"第{i}名" for i in range(1, 11)], fontsize=15)
plt.yticks(range(0, 6500000, 500000), [
           f"{i//10000}萬" for i in range(0, 6500000, 500000)], fontsize=15)

plt.subplot(2, 2, 3)
plt.title("2019與2020年四座城市的本季組織人次數(shù)對比", fontsize=20)
t1 = df_2019.loc[df_2019["指標名稱"].isin(["北京", "天津", "上海", "重慶"]), [
    "指標名稱", "本季組織人次數(shù)"]]
t2 = df_2020.loc[df_2020["指標名稱"].isin(["北京", "天津", "上海", "重慶"]), [
    "指標名稱", "本季組織人次數(shù)"]]
index = np.arange(4)
plt.bar(index, t1['本季組織人次數(shù)'], width=0.4, label='2019')
plt.bar(index+0.4, t2['本季組織人次數(shù)'], width=0.4, label='2020')
cutoff_postion = t1["本季組織人次數(shù)"].reset_index(
    drop=True).sort_values(ascending=False).index[:2]
x, y = cutoff_postion[0], t1["本季組織人次數(shù)"].iat[cutoff_postion[1]]
plt.plot(np.array([-0.2, -0.1, 0.1, 0.2])+x,
         np.array([0, 1, -1, 0])*y*0.04+y, color="white")

plt.legend(fontsize=15)
plt.grid(b=True, axis='y')
plt.xticks(index+0.2, t1['指標名稱'], fontsize=15)
plt.yticks(range(0, 4000000, 500000), [
           f"{i//10000}萬" for i in range(0, 4000000, 500000)], fontsize=15)
for x, (y1, y2) in enumerate(zip(t1["本季組織人次數(shù)"], t2["本季組織人次數(shù)"])):
    plt.text(x, y1, f"{y1/10000:.2f}萬", verticalalignment='bottom',
             horizontalalignment='center', fontsize=15)
    plt.text(x+0.4, y2, f"{y2/10000:.2f}萬", verticalalignment='bottom',
             horizontalalignment='center', fontsize=15)

plt.subplot(2, 2, 4)
plt.title("2019與2020年四座城市的本季接待人次數(shù)對比", fontsize=20)
t1 = df_2019.loc[df_2019["指標名稱"].isin(["北京", "天津", "上海", "重慶"]), [
    "指標名稱", "本季接待人次數(shù)"]]
t2 = df_2020.loc[df_2020["指標名稱"].isin(["北京", "天津", "上海", "重慶"]), [
    "指標名稱", "本季接待人次數(shù)"]]
index = np.arange(4)
plt.bar(index, t1['本季接待人次數(shù)'], width=0.4, label='2019')
plt.bar(index+0.4, t2['本季接待人次數(shù)'], width=0.4, label='2020')
cutoff_postion = t1["本季接待人次數(shù)"].reset_index(
    drop=True).sort_values(ascending=False).index[:2]
x, y = cutoff_postion[0], t1["本季接待人次數(shù)"].iat[cutoff_postion[1]]
plt.plot(np.array([-0.2, -0.1, 0.1, 0.2])+x,
         np.array([0, 1, -1, 0])*y*0.04+y, color="white")

plt.legend(fontsize=15)
plt.grid(b=True, axis='y')
plt.xticks(index+0.2, t1['指標名稱'], fontsize=15)
plt.yticks(range(0, 3000000, 500000), [
           f"{i//10000}萬" for i in range(0, 3000000, 500000)], fontsize=15)
for x, (y1, y2) in enumerate(zip(t1["本季接待人次數(shù)"], t2["本季接待人次數(shù)"])):
    plt.text(x, y1, f"{y1/10000:.2f}萬", verticalalignment='bottom',
             horizontalalignment='center', fontsize=15)
    plt.text(x+0.4, y2, f"{y2/10000:.2f}萬", verticalalignment='bottom',
             horizontalalignment='center', fontsize=15)
plt.subplots_adjust(wspace=0.1, hspace=0.15)
plt.show()

png

第二張圖

plt.style.use('fivethirtyeight')
plt.figure(figsize=(20, 20))
plt.subplot(3, 2, 1)
df_tmp = pd.concat([df_2019, df_2020]).groupby("年份").sum().drop(columns="代碼").T
plt.title("四項指標總和年度對比", fontsize=15)
index = np.arange(4)
plt.bar(index, df_tmp[2019], width=0.4, label='2019')
plt.bar(index+0.4, df_tmp[2020], width=0.4, label='2020')
plt.plot(index+0.4, df_tmp[2020], linewidth=2, color='orange')
plt.legend(title="年份")
plt.grid(b=True)
for x, (y1, y2) in enumerate(df_tmp.values):
    plt.text(x, y1, f"{y1/1e4:.1f}萬", verticalalignment='bottom',
             horizontalalignment='center')
    plt.text(x+0.4, y2, f"{y2/1e4:.1f}萬", verticalalignment='bottom',
             horizontalalignment='center')
plt.xticks(index+0.2, df_tmp.index)
plt.yticks(np.arange(0, 1.4e8, 1e7), [
           f"{i//1e4:.0f}萬" for i in np.arange(0, 1.4e8, 1e7)], fontsize=15)

plt.subplot(3, 2, 2)
plt.title("中部地帶本季組織人次數(shù)年度對比", fontsize=15)
df_tmp = pd.concat([df_2019[["指標名稱", "本季組織人次數(shù)"]].set_index("指標名稱"),
                    df_2020[["指標名稱", "本季組織人次數(shù)"]].set_index("指標名稱")], axis=1)
df_tmp.columns = [2019, 2020]
df_tmp = df_tmp.loc[["黑龍江", "吉林", "山西", "內蒙古", "安徽", "河南", "湖北", "湖南", "江西"]]
plt.barh(df_tmp.index, df_tmp[2019], label='2019')
plt.barh(df_tmp.index, -df_tmp[2020], label='2020')
plt.legend(title="年份", loc='lower right')
plt.grid(b=True)
plt.xticks(np.arange(-1e6, 2.7e6, 4e5), [
           f"{abs(i)//1e4:.0f}萬" for i in np.arange(-1e6, 2.7e6, 4e5)], fontsize=15)
for y, (x1, x2) in enumerate(df_tmp.values):
    plt.text(x1, y, f"{x1/1e4:.1f}萬", verticalalignment='center',
             horizontalalignment='left')
    plt.text(-x2, y, f"{x2/1e4:.1f}萬", verticalalignment='center',
             horizontalalignment='right')
plt.xlim([-1.1e6, 2.7e6])

plt.subplot(3, 2, 3)
df_tmp = pd.concat([df_2019[["指標名稱", "本季接待人次數(shù)"]].set_index("指標名稱"),
                    df_2020[["指標名稱", "本季接待人次數(shù)"]].set_index("指標名稱")], axis=1)
df_tmp.columns = [2019, 2020]
df_tmp.columns.name = "年份"
df_tmp = df_tmp.loc[["遼寧", "河北", "天津", "北京", "山東",
                     "江蘇", "上海", "浙江", "福建", "廣東", "廣西", "海南"]]
s = df_tmp[2019]/10000
radius_s = ((s-s.min())/(s.max()-s.min())+0.8).values
wedges, texts1, texts2 = plt.pie(
    s,  # 數(shù)據
    explode=[0.1]*df_tmp.shape[0],  # 指定每部分的偏移量
    labels=df_tmp.index,  # 標簽
    autopct="%.2f萬",  # 餅圖上的數(shù)據標簽顯示方式
    pctdistance=0.6,  # 每個餅切片的中心和通過autopct生成的文本開始之間的比例
    labeldistance=1,  # 被畫餅標記的直徑,默認值：1.1
    shadow=True,  # 陰影
    startangle=0,  # 開始角度
    radius=1.8,  # 半徑
    frame=False,  # 圖框
    counterclock=True,  # 指定指針方向，順時針或者逆時針
)
for i, wedge in enumerate(wedges):
    wedge.set_radius(radius_s[i])
for i, text in enumerate(texts1):
    text.set_position(
        tuple(map(lambda x: x*radius_s[i]/1.7, text.get_position())))
for i, text in enumerate(texts2):
    if radius_s[i] < 0.9:
        text.set_text("")
        continue
    text.set_position(
        tuple(map(lambda x: x*radius_s[i]/2, text.get_position())))

plt.subplot(3, 2, 4)
# plt.title("2020年東部沿海地帶本季接待人次數(shù)", fontsize=15)
s = df_tmp[2020]/10000
radius_s = ((s-s.min())/(s.max()-s.min())+0.8).values
wedges, texts1, texts2 = plt.pie(
    s,  # 數(shù)據
    explode=[0.1]*df_tmp.shape[0],  # 指定每部分的偏移量
    labels=df_tmp.index,  # 標簽
    autopct="%.2f萬",  # 餅圖上的數(shù)據標簽顯示方式
    pctdistance=0.6,  # 每個餅切片的中心和通過autopct生成的文本開始之間的比例
    labeldistance=1,  # 被畫餅標記的直徑,默認值：1.1
    shadow=True,  # 陰影
    startangle=0,  # 開始角度
    radius=1.8,  # 半徑
    frame=False,  # 圖框
    counterclock=True,  # 指定指針方向，順時針或者逆時針
)
for i, wedge in enumerate(wedges):
    wedge.set_radius(radius_s[i])
for i, text in enumerate(texts1):
    if radius_s[i] < 0.83:
        text.set_text("")
        continue
    text.set_position(
        tuple(map(lambda x: x*radius_s[i]/1.7, text.get_position())))
for i, text in enumerate(texts2):
    if radius_s[i] < 0.87:
        text.set_text("")
        continue
    text.set_position(
        tuple(map(lambda x: x*radius_s[i]/2, text.get_position())))


plt.subplot(3, 1, 3)
plt.title("西部地帶本季接待人天數(shù)氣泡圖", fontsize=15)
df_tmp = pd.concat([df_2019[["指標名稱", "本季接待人天數(shù)"]].set_index("指標名稱"),
                    df_2020[["指標名稱", "本季接待人天數(shù)"]].set_index("指標名稱")], axis=1)
df_tmp.columns = [2019, 2020]
df_tmp.columns.name = "年份"
df_tmp = df_tmp.loc[["陜西", "甘肅", "寧夏", "青海",
                     "新疆", "重慶", "四川", "云南", "貴州", "西藏"]]
index = range(df_tmp.shape[0])
plt.scatter(
    index,
    [2]*df_tmp.shape[0],  # 按照經緯度顯示
    s=df_tmp[2019] / 1000,  # 按照單價顯示大小
    c=range(df_tmp.shape[0]),  # 按照總價顯示顏色
    alpha=0.6,
    cmap="jet",
)
plt.scatter(
    index,
    [1]*df_tmp.shape[0],  # 按照經緯度顯示
    s=df_tmp[2020] / 1000,  # 按照單價顯示大小
    c=range(df_tmp.shape[0]),  # 按照總價顯示顏色
    alpha=0.6,
    cmap="jet",
)
for i, (v1, v2) in enumerate(df_tmp.values):
    plt.text(i, 2, f"{v1/10000:.0f}萬", verticalalignment='center',
             horizontalalignment='center', fontsize=15)
    plt.text(i, 1, f"{v2/10000:.0f}萬", verticalalignment='bottom',
             horizontalalignment='center', fontsize=15)
plt.xticks(index, df_tmp.index)
plt.yticks([1, 2], [2020, 2019])
plt.ylim([0.5, 2.5])

plt.subplots_adjust(wspace=0.1, hspace=0.4)
plt.show()

png

贊賞

共11人贊賞

小男孩‘自慰网亚洲一区二区,亚洲一级在线播放毛片,亚洲中文字幕av每天更新,黄aⅴ永久免费无码,91成人午夜在线精品,色网站免费在线观看,亚洲欧洲wwwww在线观看

【原】用Matplotlib畫兩張花里胡哨的圖

導包

數(shù)據讀取

第一張圖

第二張圖