Python+matplotlib实现折线图的美化
作者:Python学习与数据挖掘 发布时间:2023-09-05 20:03:18
标签:Python,matplotlib,折线图
大家好,今天分享一个非常有趣的 Python 教程,如何美化一个 matplotlib 折线图,喜欢记得收藏、关注、点赞。
1. 导入包
import pandas as pd
import matplotlib.pyplot as plt
import matplotlib.ticker as ticker
import matplotlib.gridspec as gridspec
2. 获得数据
file_id = '1yM_F93NY4QkxjlKL3GzdcCQEnBiA2ltB'
url = f'https://drive.google.com/uc?id={file_id}'
df = pd.read_csv(url, index_col=0)
df
数据长得是这样的:
3. 对数据做一些预处理
按照需要,对数据再做一些预处理,代码及效果如下:
home_df = df.copy()
home_df = home_df.melt(id_vars = ["date", "home_team_name", "away_team_name"])
home_df["venue"] = "H"
home_df.rename(columns = {"home_team_name":"team", "away_team_name":"opponent"}, inplace = True)
home_df.replace({"variable":{"home_team_xG":"xG_for", "away_team_xG":"xG_ag"}}, inplace = True)
away_df = df.copy()
away_df = away_df.melt(id_vars = ["date", "away_team_name", "home_team_name"])
away_df["venue"] = "A"
away_df.rename(columns = {"away_team_name":"team", "home_team_name":"opponent"}, inplace = True)
away_df.replace({"variable":{"away_team_xG":"xG_for", "home_team_xG":"xG_ag"}}, inplace = True)
df = pd.concat([home_df, away_df]).reset_index(drop = True)
df
4. 画图
# ---- Filter the data
Y_for = df[(df["team"] == "Lazio") & (df["variable"] == "xG_for")]["value"].reset_index(drop = True)
Y_ag = df[(df["team"] == "Lazio") & (df["variable"] == "xG_ag")]["value"].reset_index(drop = True)
X_ = pd.Series(range(len(Y_for)))
# ---- Compute rolling average
Y_for = Y_for.rolling(window = 5, min_periods = 0).mean() # min_periods is for partial avg.
Y_ag = Y_ag.rolling(window = 5, min_periods = 0).mean()
fig, ax = plt.subplots(figsize = (7,3), dpi = 200)
ax.plot(X_, Y_for)
ax.plot(X_, Y_ag)
使用matplotlib倒是可以快速把图画好了,但是太丑了。接下来进行优化。
4.1 优化:添加点
这里为每一个数据添加点
fig, ax = plt.subplots(figsize = (7,3), dpi = 200)
# --- Remove spines and add gridlines
ax.spines["left"].set_visible(False)
ax.spines["top"].set_visible(False)
ax.spines["right"].set_visible(False)
ax.grid(ls = "--", lw = 0.5, color = "#4E616C")
# --- The data
ax.plot(X_, Y_for, marker = "o")
ax.plot(X_, Y_ag, marker = "o")
4.2 优化:设置刻度
fig, ax = plt.subplots(figsize = (7,3), dpi = 200)
# --- Remove spines and add gridlines
ax.spines["left"].set_visible(False)
ax.spines["top"].set_visible(False)
ax.spines["right"].set_visible(False)
ax.grid(ls = "--", lw = 0.25, color = "#4E616C")
# --- The data
ax.plot(X_, Y_for, marker = "o", mfc = "white", ms = 5)
ax.plot(X_, Y_ag, marker = "o", mfc = "white", ms = 5)
# --- Adjust tickers and spine to match the style of our grid
ax.xaxis.set_major_locator(ticker.MultipleLocator(2)) # ticker every 2 matchdays
xticks_ = ax.xaxis.set_ticklabels([x - 1 for x in range(0, len(X_) + 3, 2)])
# This last line outputs
# [-1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31, 33, 35]
# and we mark the tickers every two positions.
ax.xaxis.set_tick_params(length = 2, color = "#4E616C", labelcolor = "#4E616C", labelsize = 6)
ax.yaxis.set_tick_params(length = 2, color = "#4E616C", labelcolor = "#4E616C", labelsize = 6)
ax.spines["bottom"].set_edgecolor("#4E616C")
4.3 优化:设置填充
fig, ax = plt.subplots(figsize = (7,3), dpi = 200)
# --- Remove spines and add gridlines
ax.spines["left"].set_visible(False)
ax.spines["top"].set_visible(False)
ax.spines["right"].set_visible(False)
ax.grid(ls = "--", lw = 0.25, color = "#4E616C")
# --- The data
ax.plot(X_, Y_for, marker = "o", mfc = "white", ms = 5)
ax.plot(X_, Y_ag, marker = "o", mfc = "white", ms = 5)
# --- Fill between
ax.fill_between(x = X_, y1 = Y_for, y2 = Y_ag, alpha = 0.5)
# --- Adjust tickers and spine to match the style of our grid
ax.xaxis.set_major_locator(ticker.MultipleLocator(2)) # ticker every 2 matchdays
xticks_ = ax.xaxis.set_ticklabels([x - 1 for x in range(0, len(X_) + 3, 2)])
ax.xaxis.set_tick_params(length = 2, color = "#4E616C", labelcolor = "#4E616C", labelsize = 6)
ax.yaxis.set_tick_params(length = 2, color = "#4E616C", labelcolor = "#4E616C", labelsize = 6)
ax.spines["bottom"].set_edgecolor("#4E616C")
4.4 优化:设置填充颜色
1.当橙色线更高时,希望填充为橙色。但是上面的还无法满足,这里再优化一下.
fig, ax = plt.subplots(figsize = (7,3), dpi = 200)
# --- Remove spines and add gridlines
ax.spines["left"].set_visible(False)
ax.spines["top"].set_visible(False)
ax.spines["right"].set_visible(False)
ax.grid(ls = "--", lw = 0.25, color = "#4E616C")
# --- The data
ax.plot(X_, Y_for, marker = "o", mfc = "white", ms = 5)
ax.plot(X_, Y_ag, marker = "o", mfc = "white", ms = 5)
# --- Fill between
# Identify points where Y_for > Y_ag
pos_for = (Y_for > Y_ag)
ax.fill_between(x = X_[pos_for], y1 = Y_for[pos_for], y2 = Y_ag[pos_for], alpha = 0.5)
pos_ag = (Y_for <= Y_ag)
ax.fill_between(x = X_[pos_ag], y1 = Y_for[pos_ag], y2 = Y_ag[pos_ag], alpha = 0.5)
# --- Adjust tickers and spine to match the style of our grid
ax.xaxis.set_major_locator(ticker.MultipleLocator(2)) # ticker every 2 matchdays
xticks_ = ax.xaxis.set_ticklabels([x - 1 for x in range(0, len(X_) + 3, 2)])
ax.xaxis.set_tick_params(length = 2, color = "#4E616C", labelcolor = "#4E616C", labelsize = 6)
ax.yaxis.set_tick_params(length = 2, color = "#4E616C", labelcolor = "#4E616C", labelsize = 6)
ax.spines["bottom"].set_edgecolor("#4E616C")
上面的图出现异常,再修改一下:
X_aux = X_.copy()
X_aux.index = X_aux.index * 10 # 9 aux points in between each match
last_idx = X_aux.index[-1] + 1
X_aux = X_aux.reindex(range(last_idx))
X_aux = X_aux.interpolate()
# --- Aux series for the xG created (Y_for)
Y_for_aux = Y_for.copy()
Y_for_aux.index = Y_for_aux.index * 10
last_idx = Y_for_aux.index[-1] + 1
Y_for_aux = Y_for_aux.reindex(range(last_idx))
Y_for_aux = Y_for_aux.interpolate()
# --- Aux series for the xG conceded (Y_ag)
Y_ag_aux = Y_ag.copy()
Y_ag_aux.index = Y_ag_aux.index * 10
last_idx = Y_ag_aux.index[-1] + 1
Y_ag_aux = Y_ag_aux.reindex(range(last_idx))
Y_ag_aux = Y_ag_aux.interpolate()
fig, ax = plt.subplots(figsize = (7,3), dpi = 200)
# --- Remove spines and add gridlines
ax.spines["left"].set_visible(False)
ax.spines["top"].set_visible(False)
ax.spines["right"].set_visible(False)
ax.grid(ls = "--", lw = 0.25, color = "#4E616C")
# --- The data
for_ = ax.plot(X_, Y_for, marker = "o", mfc = "white", ms = 5)
ag_ = ax.plot(X_, Y_ag, marker = "o", mfc = "white", ms = 5)
# --- Fill between
for index in range(len(X_aux) - 1):
# Choose color based on which line's on top
if Y_for_aux.iloc[index + 1] > Y_ag_aux.iloc[index + 1]:
color = for_[0].get_color()
else:
color = ag_[0].get_color()
# Fill between the current point and the next point in pur extended series.
ax.fill_between([X_aux[index], X_aux[index+1]],
[Y_for_aux.iloc[index], Y_for_aux.iloc[index+1]],
[Y_ag_aux.iloc[index], Y_ag_aux.iloc[index+1]],
color=color, zorder = 2, alpha = 0.2, ec = None)
# --- Adjust tickers and spine to match the style of our grid
ax.xaxis.set_major_locator(ticker.MultipleLocator(2)) # ticker every 2 matchdays
xticks_ = ax.xaxis.set_ticklabels([x - 1 for x in range(0, len(X_) + 3, 2)])
ax.xaxis.set_tick_params(length = 2, color = "#4E616C", labelcolor = "#4E616C", labelsize = 6)
ax.yaxis.set_tick_params(length = 2, color = "#4E616C", labelcolor = "#4E616C", labelsize = 6)
ax.spines["bottom"].set_edgecolor("#4E616C")
5. 把功能打包成函数
上面的样子都还不错啦,接下来把这些东西都打包成一个函数。方便后面直接出图。
def plot_xG_rolling(team, ax, window = 5, color_for = "blue", color_ag = "orange", data = df):
'''
This function creates a rolling average xG plot for a given team and rolling
window.
team (str): The team's name
ax (obj): a Matplotlib axes.
window (int): The number of periods for our rolling average.
color_for (str): A hex color code for xG created.
color_af (str): A hex color code for xG conceded.
data (DataFrame): our df with the xG data.
'''
# -- Prepping the data
home_df = data.copy()
home_df = home_df.melt(id_vars = ["date", "home_team_name", "away_team_name"])
home_df["venue"] = "H"
home_df.rename(columns = {"home_team_name":"team", "away_team_name":"opponent"}, inplace = True)
home_df.replace({"variable":{"home_team_xG":"xG_for", "away_team_xG":"xG_ag"}}, inplace = True)
away_df = data.copy()
away_df = away_df.melt(id_vars = ["date", "away_team_name", "home_team_name"])
away_df["venue"] = "A"
away_df.rename(columns = {"away_team_name":"team", "home_team_name":"opponent"}, inplace = True)
away_df.replace({"variable":{"away_team_xG":"xG_for", "home_team_xG":"xG_ag"}}, inplace = True)
df = pd.concat([home_df, away_df]).reset_index(drop = True)
# ---- Filter the data
Y_for = df[(df["team"] == team) & (df["variable"] == "xG_for")]["value"].reset_index(drop = True)
Y_ag = df[(df["team"] == team) & (df["variable"] == "xG_ag")]["value"].reset_index(drop = True)
X_ = pd.Series(range(len(Y_for)))
if Y_for.shape[0] == 0:
raise ValueError(f"Team {team} is not present in the DataFrame")
# ---- Compute rolling average
Y_for = Y_for.rolling(window = 5, min_periods = 0).mean() # min_periods is for partial avg.
Y_ag = Y_ag.rolling(window = 5, min_periods = 0).mean()
# ---- Create auxiliary series for filling between curves
X_aux = X_.copy()
X_aux.index = X_aux.index * 10 # 9 aux points in between each match
last_idx = X_aux.index[-1] + 1
X_aux = X_aux.reindex(range(last_idx))
X_aux = X_aux.interpolate()
# --- Aux series for the xG created (Y_for)
Y_for_aux = Y_for.copy()
Y_for_aux.index = Y_for_aux.index * 10
last_idx = Y_for_aux.index[-1] + 1
Y_for_aux = Y_for_aux.reindex(range(last_idx))
Y_for_aux = Y_for_aux.interpolate()
# --- Aux series for the xG conceded (Y_ag)
Y_ag_aux = Y_ag.copy()
Y_ag_aux.index = Y_ag_aux.index * 10
last_idx = Y_ag_aux.index[-1] + 1
Y_ag_aux = Y_ag_aux.reindex(range(last_idx))
Y_ag_aux = Y_ag_aux.interpolate()
# --- Plotting our data
# --- Remove spines and add gridlines
ax.spines["left"].set_visible(False)
ax.spines["top"].set_visible(False)
ax.spines["right"].set_visible(False)
ax.grid(ls = "--", lw = 0.25, color = "#4E616C")
# --- The data
for_ = ax.plot(X_, Y_for, marker = "o", mfc = "white", ms = 4, color = color_for)
ag_ = ax.plot(X_, Y_ag, marker = "o", mfc = "white", ms = 4, color = color_ag)
# --- Fill between
for index in range(len(X_aux) - 1):
# Choose color based on which line's on top
if Y_for_aux.iloc[index + 1] > Y_ag_aux.iloc[index + 1]:
color = for_[0].get_color()
else:
color = ag_[0].get_color()
# Fill between the current point and the next point in pur extended series.
ax.fill_between([X_aux[index], X_aux[index+1]],
[Y_for_aux.iloc[index], Y_for_aux.iloc[index+1]],
[Y_ag_aux.iloc[index], Y_ag_aux.iloc[index+1]],
color=color, zorder = 2, alpha = 0.2, ec = None)
# --- Ensure minimum value of Y-axis is zero
ax.set_ylim(0)
# --- Adjust tickers and spine to match the style of our grid
ax.xaxis.set_major_locator(ticker.MultipleLocator(2)) # ticker every 2 matchdays
xticks_ = ax.xaxis.set_ticklabels([x - 1 for x in range(0, len(X_) + 3, 2)])
ax.xaxis.set_tick_params(length = 2, color = "#4E616C", labelcolor = "#4E616C", labelsize = 6)
ax.yaxis.set_tick_params(length = 2, color = "#4E616C", labelcolor = "#4E616C", labelsize = 6)
ax.spines["bottom"].set_edgecolor("#4E616C")
# --- Legend and team name
Y_for_last = Y_for.iloc[-1]
Y_ag_last = Y_ag.iloc[-1]
# -- Add the team's name
team_ = ax.text(
x = 0, y = ax.get_ylim()[1] + ax.get_ylim()[1]/20,
s = f'{team}',
color = "#4E616C",
va = 'center',
ha = 'left',
size = 7
)
# -- Add the xG created label
for_label_ = ax.text(
x = X_.iloc[-1] + 0.75, y = Y_for_last,
s = f'{Y_for_last:,.1f} xGF',
color = color_for,
va = 'center',
ha = 'left',
size = 6.5
)
# -- Add the xG conceded label
ag_label_ = ax.text(
x = X_.iloc[-1] + 0.75, y = Y_ag_last,
s = f'{Y_ag_last:,.1f} xGA',
color = color_ag,
va = 'center',
ha = 'left',
size = 6.5
)
6.测试函数
file_id = '1yM_F93NY4QkxjlKL3GzdcCQEnBiA2ltB'
url = f'https://drive.google.com/uc?id={file_id}'
df = pd.read_csv(url, index_col=0)
fig = plt.figure(figsize=(5, 2), dpi = 200)
ax = plt.subplot(111)
plot_xG_rolling("Sassuolo", ax, color_for = "#00A752", color_ag = "black", data = df)
plt.tight_layout()
再设置更加丰富的颜色:
fig = plt.figure(figsize=(5, 8), dpi = 200, facecolor = "#EFE9E6")
ax1 = plt.subplot(411, facecolor = "#EFE9E6")
ax2 = plt.subplot(412, facecolor = "#EFE9E6")
ax3 = plt.subplot(413, facecolor = "#EFE9E6")
ax4 = plt.subplot(414, facecolor = "#EFE9E6")
plot_xG_rolling("Sassuolo", ax1, color_for = "#00A752", color_ag = "black", data = df)
plot_xG_rolling("Lazio", ax2, color_for = "#87D8F7", color_ag = "#15366F", data = df)
plot_xG_rolling("Hellas Verona", ax3, color_for = "#153aab", color_ag = "#fdcf41", data = df)
plot_xG_rolling("Empoli", ax4, color_for = "#00579C", color_ag = "black", data = df)
plt.tight_layout()
最后
其实本文主要是对两个折线图做了一系列的优化和改进而已,主要是强调细节部分。
涉及到的matplotlib的知识,也主要是在ticks、背景颜色、fill_between部分。
来源:https://blog.csdn.net/weixin_38037405/article/details/124719333
0
投稿
猜你喜欢
- 触发器权限和所有权CREATE TRIGGER 权限默认授予定义触发器的表所有者、sysadmin 固定服务器角色成员以及 db_owner
- ASP中判断字符串中是否包含字母和数字的两个函数function isnaw(str) for
- 提到SQL Server 2005证书,很多人可能以为它只是用来在传输数据的时候起到加密作用的,但在深入了解后,你会发现它的用处还有很多。
- 笔者认为,在创建索引时要做到三个适当,即在适当的表上、适当的列上创建适当数量的索引。虽然这可以通过一句话来概括优化的索引的基本准则,但是要做
- 一、常见模型分类1.1、循环服务器模型循环接收客户端请求,处理请求。同一时刻只能处理一个请求,处理完毕后再处理下一个。优点:实现简单,占用资
- 用python写了一个简单版本的textrank,实现提取关键词的功能。import numpy as np import jieba im
- 我们可用正规表达式来寻找并替换URL和邮件地址为活动的超级链接。用到的主要函数就是InsertHyperlinks(inText),语法为:
- orm查询优化1)only与referonly方法返回的是一个queryset对象,本质就是列表套数据对象该对象内只含有only括号所指定的
- 一、题目内容给定一个非负整数 num。对于 0 ≤ i ≤ num 范围中的每个数字 i ,计算其二进制数中的
- Response是负责将信息传递给用户的对象,它可动态地响应客户端的请求,并将动态生成的响应结果返回给客户端浏览器。 一,Resp
- SQL语言共分为四大类:数据查询语言DQL,数据操纵语言DML, 数据定义语言DDL,数据控制语言DCL。其中用于定义数据的结构,比如 创建
- PHP作为开源语言,发展至今已有很多成熟的国内外开源系统,足以满足个人和企业用户自己建立WEB站点,下面则主要介绍PHP建站的流程和步骤。不
- 本文实例讲述了Laravel框架执行原生SQL语句及使用paginate分页的方法。分享给大家供大家参考,具体如下:1、运行原生sqlpub
- 本文主讲Python中Numpy数组的类型、全0全1数组的生成、随机数组、数组操作、矩阵的简单运算、矩阵的数学运算。尽管可以用python中
- 文章主要讲术了一些SQL Server新的Bug,帮您认识这些被忽略的SQL Server注入技巧。1.关于Openrowset和Opend
- 阅读上一篇:打造设计你自己的字体 ⅠMyFonts.com上销售的字体总数已经超过55,000个。现有字体的巨大数量表明了一个事实:我们在设
- PHP session用法其实很简单它可以把用户提交的数据以全局变量形式保存在一个session中并且会生成一个唯一的session_id,
- 如下所示:#encoding=utf-8#x=raw_input("Please enter a text: ")y=x
- Python continue语句:当执行到 continue 语句时,将不再执行本次循环中 continue 语句接下来的部分,而是继续下
- 下一步是将新创建的应用程序与项目相关联。为此,您需要编辑 myproj 文件夹中的 settings.py 文件,将字符串“myproj.m