8000字 | Python数据可视化,完整版实操指南 !
点击“简说Python”,选择“置顶/星标公众号”
福利干货,第一时间送达
1. 前言
data:image/s3,"s3://crabby-images/3fa90/3fa90227cd3eed1d3458e58782161161c258800e" alt=""
2. pandas
import pandas as pd
df = pd.read_csv('temporal.csv')
df.head(10) #View first 10 data rows
data:image/s3,"s3://crabby-images/ec4c8/ec4c8138be57b4a36895f91c9f0483725d39e35f" alt=""
df.describe()
data:image/s3,"s3://crabby-images/7a4d1/7a4d150d669072f81fd4cc01298fae36bdfb9719" alt=""
df.info()
data:image/s3,"s3://crabby-images/5e7a0/5e7a05b99d3a12998f613f7d3e4cbd3944b9f0ee" alt=""
data:image/s3,"s3://crabby-images/d6fc5/d6fc5946b1668ca7e11d7ef31632c351c28ad0cd" alt=""
pd.set_option('display.max_rows',500)
pd.set_option('display.max_columns',500)
pd.set_option('display.width',1000)
format_dict = {'data science':'${0:,.2f}', 'Mes':'{:%m-%Y}', 'machine learning':'{:.2%}'}
#We make sure that the Month column has datetime format
df['Mes'] = pd.to_datetime(df['Mes'])
#We apply the style to the visualization
df.head().style.format(format_dict)
format_dict = {'Mes':'{:%m-%Y}'} #Simplified format dictionary with values that do make sense for our data
df.head().style.format(format_dict).highlight_max(color='darkgreen').highlight_min(color='#ff0000')
data:image/s3,"s3://crabby-images/67558/675581b0fc86650b79559777843be680d005b665" alt=""
df.head(10).style.format(format_dict).background_gradient(subset=['data science', 'machine learning'], cmap='BuGn')
data:image/s3,"s3://crabby-images/6d5b4/6d5b467197ced9071abd27dd476775d29bf3f77d" alt=""
df.head().style.format(format_dict).bar(color='red', subset=['data science', 'deep learning'])
data:image/s3,"s3://crabby-images/14a1c/14a1c9ee97b5fc8f28d59f2ca78bc745f63981f1" alt=""
df.head(10).style.format(format_dict).background_gradient(subset = ['data science','machine learning'],cmap ='BuGn')。highlight_max(color ='yellow')
data:image/s3,"s3://crabby-images/08c37/08c370b76cc568ebffd76de745cc8221eb074d6a" alt=""
from pandas_profiling import ProfileReport
prof = ProfileReport(df)
prof.to_file(output_file='report.html')
data:image/s3,"s3://crabby-images/cccfc/cccfce23deff981212e2a0aaa802a948bcf18ffc" alt=""
3. matplotlib
import matplotlib.pyplot as plt
plt.plot(df['Mes'], df['data science'], label='data science')
# The parameter label is to indicate the legend. This doesn't mean that it will be shown, we'll have to use another command that I'll explain later.
data:image/s3,"s3://crabby-images/2094b/2094ba801af3e105df70499116412e9ee967e223" alt=""
plt.plot(df ['Mes'],df ['data science'],label ='data science')
plt.plot(df ['Mes'],df ['machine learning'],label ='machine learning ')
plt.plot(df ['Mes'],df ['deep learning'],label ='deep learning')
data:image/s3,"s3://crabby-images/9210c/9210c3c9fa70b73c29a90e26e4d6b9213f188294" alt=""
plt.plot(df['Mes'], df['data science'], label='data science')
plt.plot(df['Mes'], df['machine learning'], label='machine learning')
plt.plot(df['Mes'], df['deep learning'], label='deep learning')
plt.xlabel('Date')
plt.ylabel('Popularity')
plt.title('Popularity of AI terms by date')
plt.grid(True)
plt.legend()
data:image/s3,"s3://crabby-images/1231d/1231da96fd2bb7c06e3efdaf180646bb59db5692" alt=""
fig, axes = plt.subplots(2,2)
axes[0, 0].hist(df['data science'])
axes[0, 1].scatter(df['Mes'], df['data science'])
axes[1, 0].plot(df['Mes'], df['machine learning'])
axes[1, 1].plot(df['Mes'], df['deep learning'])
data:image/s3,"s3://crabby-images/d4ab2/d4ab2ce56ac0dae8e24b572d59a2fdd3fefaad0c" alt=""
plt.plot(df ['Mes'],df ['data science'],'r-')
plt.plot(df ['Mes'],df ['data science'] * 2,'bs')
plt .plot(df ['Mes'],df ['data science'] * 3,'g ^')
data:image/s3,"s3://crabby-images/2d23e/2d23e5a2d01b18c4d4a9bfd0a53941309b2cf663" alt=""
plt.scatter(df['data science'], df['machine learning'])
data:image/s3,"s3://crabby-images/3a188/3a188bf24cad3db1b1a391b35d62773018cbdd0c" alt=""
plt.bar(df ['Mes'],df ['machine learning'],width = 20)
data:image/s3,"s3://crabby-images/0648e/0648e21aef817e49479d75261c3b3834a336128d" alt=""
plt.hist(df ['deep learning'],bins = 15)
data:image/s3,"s3://crabby-images/ba7db/ba7dbf18fe43c7b1a9fc0b17ec97d5fbe08823bc" alt=""
plt.plot(df['Mes'], df['data science'], label='data science')
plt.plot(df['Mes'], df['machine learning'], label='machine learning')
plt.plot(df['Mes'], df['deep learning'], label='deep learning')
plt.xlabel('Date')
plt.ylabel('Popularity')
plt.title('Popularity of AI terms by date')
plt.grid(True)
plt.text(x='2010-01-01', y=80, s=r'$\lambda=1, r^2=0.8$') #Coordinates use the same units as the graph
plt.annotate('Notice something?', xy=('2014-01-01', 30), xytext=('2006-01-01', 50), arrowprops={'facecolor':'red', 'shrink':0.05}
data:image/s3,"s3://crabby-images/52d6e/52d6ee003f066985bd4ac4011a2dd5fd7b262744" alt=""
4. seaborn
import seaborn as sns
sns.set()
sns.scatterplot(df['Mes'], df['data science'])
data:image/s3,"s3://crabby-images/94aef/94aef5c2e0d04c44e4366fc3ce0c0780271af60e" alt=""
sns.relplot(x='Mes', y='deep learning', hue='data science', size='machine learning', col='categorical', data=df)
data:image/s3,"s3://crabby-images/a8422/a8422510f42a38aecc7fc1158cce2e04b49aacc6" alt=""
sns.heatmap(df.corr(),annot = True,fmt ='。2f')
data:image/s3,"s3://crabby-images/e028e/e028e6fd70e341c0a0d3b834e4dfec4087815701" alt=""
sns.pairplot(df)
data:image/s3,"s3://crabby-images/55d14/55d142ae6c4387e00d4c4cfb41563e202a1ea0b8" alt=""
sns.pairplot(df,hue ='categorical')
data:image/s3,"s3://crabby-images/9071b/9071b11ae1e5527a1012366dea67385d9d610f61" alt=""
sns.jointplot(x='data science', y='machine learning', data=df)
data:image/s3,"s3://crabby-images/5cdbf/5cdbf968bf20d2173643a4265d8bc1902204638a" alt=""
sns.catplot(x='categorical', y='data science', kind='violin', data=df)
data:image/s3,"s3://crabby-images/2990a/2990a9ae0f09dfc74574b075e0e25d2ff4bdb781" alt=""
fig, axes = plt.subplots(1, 2, sharey=True, figsize=(8, 4))
sns.scatterplot(x="Mes", y="deep learning", hue="categorical", data=df, ax=axes[0])
axes[0].set_title('Deep Learning')
sns.scatterplot(x="Mes", y="machine learning", hue="categorical", data=df, ax=axes[1])
axes[1].set_title('Machine Learning')
data:image/s3,"s3://crabby-images/e81d6/e81d6d08987ee54bf8950a0d4a8a462ffb252fa2" alt=""
5. Bokeh
from bokeh.plotting import figure, output_file, save
output_file('data_science_popularity.html')
p = figure(title='data science', x_axis_label='Mes', y_axis_label='data science')
p.line(df['Mes'], df['data science'], legend='popularity', line_width=2)
save(p)
data:image/s3,"s3://crabby-images/60ebe/60ebe14c7a1b51c532763930c06c9d3e36ffddee" alt=""
output_file('multiple_graphs.html')
s1 = figure(width=250, plot_height=250, title='data science')
s1.circle(df['Mes'], df['data science'], size=10, color='navy', alpha=0.5)
s2 = figure(width=250, height=250, x_range=s1.x_range, y_range=s1.y_range, title='machine learning') #share both axis range
s2.triangle(df['Mes'], df['machine learning'], size=10, color='red', alpha=0.5)
s3 = figure(width=250, height=250, x_range=s1.x_range, title='deep learning') #share only one axis range
s3.square(df['Mes'], df['deep learning'], size=5, color='green', alpha=0.5)
p = gridplot([[s1, s2, s3]])
save(p)
data:image/s3,"s3://crabby-images/14565/14565b77810d02789dfc1223494125b0f174742a" alt=""
6. altair
7. folium
import folium
m1 = folium.Map(location=[41.38, 2.17], tiles='openstreetmap', zoom_start=18)
m1.save('map1.html')
data:image/s3,"s3://crabby-images/fbcf4/fbcf49ee08300b0b6e9ae25499d9d3a0194b00e8" alt=""
m2 = folium.Map(location=[41.38, 2.17], tiles='openstreetmap', zoom_start=16)
folium.Marker([41.38, 2.176], popup='<i>You can use whatever HTML code you want</i>', tooltip='click here').add_to(m2)
folium.Marker([41.38, 2.174], popup='<b>You can use whatever HTML code you want</b>', tooltip='dont click here').add_to(m2)
m2.save('map2.html')
data:image/s3,"s3://crabby-images/a392e/a392e8e4f4e06428677035642b39fe3e265028ee" alt=""
from geopandas.tools import geocode
df2 = pd.read_csv('mapa.csv')
df2.dropna(axis=0, inplace=True)
df2['geometry'] = geocode(df2['País'], provider='nominatim')['geometry'] #It may take a while because it downloads a lot of data.
df2['Latitude'] = df2['geometry'].apply(lambda l: l.y)
df2['Longitude'] = df2['geometry'].apply(lambda l: l.x)
data:image/s3,"s3://crabby-images/f580a/f580af192635b03b1df44a5f71af6ec2c539fa2c" alt=""
m3 = folium.Map(location=[39.326234,-4.838065], tiles='openstreetmap', zoom_start=3)
def color_producer(val):
if val <= 50:
return 'red'
else:
return 'green'
for i in range(0,len(df2)):
folium.Circle(location=[df2.iloc[i]['Latitud'], df2.iloc[i]['Longitud']], radius=5000*df2.iloc[i]['data science'], color=color_producer(df2.iloc[i]['data science'])).add_to(m3)
m3.save('map3.html')
data:image/s3,"s3://crabby-images/ad503/ad503f2787d420bc081142bc3e335b4d4f9cb1b2" alt=""
扫码即可加我微信
即可获取最新学习资源
学习更多: 整理了我开始分享学习笔记到现在超过250篇优质文章,涵盖数据分析、爬虫、机器学习等方面,别再说不知道该从哪开始,实战哪里找了
“点赞”传统美德不能丢
评论