4000字,一篇 Python 数据可视化 "保姆级" 攻略!
↑ 关注 + 星标 ,每天学Python新技能
后台回复【大礼包】送你Python自学大礼包
2. pandas
import pandas as pd
df = pd.read_csv('temporal.csv')
df.head(10) #View first 10 data rows
data:image/s3,"s3://crabby-images/6a37f/6a37fb67bb0bf629f5d24bad46d01e22c4f8b5e9" alt=""
df.describe()
data:image/s3,"s3://crabby-images/eb85b/eb85b656a1429dbfd11f6e0409497eb6264d19e1" alt=""
df.info()
data:image/s3,"s3://crabby-images/d3c6c/d3c6ca8a48f095a6ecbbd17d7bb4f43f4951a5d1" alt=""
data:image/s3,"s3://crabby-images/146cb/146cb6f2761e2dd4525528f4b8761fb2aa892cd3" alt=""
pd.set_option('display.max_rows',500)
pd.set_option('display.max_columns',500)
pd.set_option('display.width',1000)
format_dict = {'data science':'${0:,.2f}', 'Mes':'{:%m-%Y}', 'machine learning':'{:.2%}'}
#We make sure that the Month column has datetime format
df['Mes'] = pd.to_datetime(df['Mes'])
#We apply the style to the visualization
df.head().style.format(format_dict)
format_dict = {'Mes':'{:%m-%Y}'} #Simplified format dictionary with values that do make sense for our data
df.head().style.format(format_dict).highlight_max(color='darkgreen').highlight_min(color='#ff0000')
data:image/s3,"s3://crabby-images/998ec/998ec1d5bd8e14c172d4968ed54e6b4de770b8a4" alt=""
df.head(10).style.format(format_dict).background_gradient(subset=['data science', 'machine learning'], cmap='BuGn')
data:image/s3,"s3://crabby-images/6b64d/6b64dac5889db25de8c0ad2f9f49e66e42d2b0e7" alt=""
df.head().style.format(format_dict).bar(color='red', subset=['data science', 'deep learning'])
data:image/s3,"s3://crabby-images/1a8bb/1a8bbd6dcac6be90cf9acebd7b1875abd1af3aff" alt=""
df.head(10).style.format(format_dict).background_gradient(subset = ['data science','machine learning'],cmap ='BuGn')。highlight_max(color ='yellow')
data:image/s3,"s3://crabby-images/5c2da/5c2dae5c200d3bb1af9d489d2d94827766b8fc50" alt=""
from pandas_profiling import ProfileReport
prof = ProfileReport(df)
prof.to_file(output_file='report.html')
data:image/s3,"s3://crabby-images/7e40f/7e40f96f06a0ee6970d218da3c2b2e3a99ca40ec" alt=""
3. matplotlib
import matplotlib.pyplot as plt
plt.plot(df['Mes'], df['data science'], label='data science')
# The parameter label is to indicate the legend. This doesn't mean that it will be shown, we'll have to use another command that I'll explain later.
data:image/s3,"s3://crabby-images/d19f2/d19f2e9dad0cec6e032293c22e2d7376f7f092ec" alt=""
plt.plot(df ['Mes'],df ['data science'],label ='data science')
plt.plot(df ['Mes'],df ['machine learning'],label ='machine learning ')
plt.plot(df ['Mes'],df ['deep learning'],label ='deep learning')
data:image/s3,"s3://crabby-images/75106/75106e42e5eafcbe4c634ef4ecd2e49232356c3d" alt=""
plt.plot(df['Mes'], df['data science'], label='data science')
plt.plot(df['Mes'], df['machine learning'], label='machine learning')
plt.plot(df['Mes'], df['deep learning'], label='deep learning')
plt.xlabel('Date')
plt.ylabel('Popularity')
plt.title('Popularity of AI terms by date')
plt.grid(True)
plt.legend()
data:image/s3,"s3://crabby-images/10251/10251d7ac837f869a96b940cfc9cf17062fca492" alt=""
fig, axes = plt.subplots(2,2)
axes[0, 0].hist(df['data science'])
axes[0, 1].scatter(df['Mes'], df['data science'])
axes[1, 0].plot(df['Mes'], df['machine learning'])
axes[1, 1].plot(df['Mes'], df['deep learning'])
data:image/s3,"s3://crabby-images/fac78/fac78d9bbdb30b1e7a9574325f0bc755ff0c68fe" alt=""
plt.plot(df ['Mes'],df ['data science'],'r-')
plt.plot(df ['Mes'],df ['data science'] * 2,'bs')
plt .plot(df ['Mes'],df ['data science'] * 3,'g ^')
data:image/s3,"s3://crabby-images/45f26/45f266c8a447e90501cee4dab097a29fbc7531b4" alt=""
plt.scatter(df['data science'], df['machine learning'])
data:image/s3,"s3://crabby-images/29760/2976049785e79a2448d45baa76d91c389a9db01e" alt=""
plt.bar(df ['Mes'],df ['machine learning'],width = 20)
data:image/s3,"s3://crabby-images/4d754/4d7542762878e15942627b80b5f339b1595dab18" alt=""
plt.hist(df ['deep learning'],bins = 15)
data:image/s3,"s3://crabby-images/6c44d/6c44d59b02581aa1d2652fb258284ed3b9b1c695" alt=""
plt.plot(df['Mes'], df['data science'], label='data science')
plt.plot(df['Mes'], df['machine learning'], label='machine learning')
plt.plot(df['Mes'], df['deep learning'], label='deep learning')
plt.xlabel('Date')
plt.ylabel('Popularity')
plt.title('Popularity of AI terms by date')
plt.grid(True)
plt.text(x='2010-01-01', y=80, s=r'$\lambda=1, r^2=0.8$') #Coordinates use the same units as the graph
plt.annotate('Notice something?', xy=('2014-01-01', 30), xytext=('2006-01-01', 50), arrowprops={'facecolor':'red', 'shrink':0.05}
data:image/s3,"s3://crabby-images/4c908/4c908df727e1cd207b50f0ffabb55fcd1bd15ae7" alt=""
4. seaborn
import seaborn as sns
sns.set()
sns.scatterplot(df['Mes'], df['data science'])
data:image/s3,"s3://crabby-images/eaba1/eaba1656708319361997ce9efc6faaa5dfb417d9" alt=""
sns.relplot(x='Mes', y='deep learning', hue='data science', size='machine learning', col='categorical', data=df)
data:image/s3,"s3://crabby-images/a2698/a2698caa8f20da3cf80c99a8a5977e89607a2b8e" alt=""
sns.heatmap(df.corr(),annot = True,fmt ='。2f')
data:image/s3,"s3://crabby-images/a5545/a5545f2e090fc492df53bd5e0c2ffcb6c6d9dfe7" alt=""
sns.pairplot(df)
data:image/s3,"s3://crabby-images/15e61/15e61751e7279e7a7507f2f1e41ea1d99ae7093f" alt=""
sns.pairplot(df,hue ='categorical')
data:image/s3,"s3://crabby-images/67a28/67a2875b97124be5cf8fde9d513b9519773995f9" alt=""
sns.jointplot(x='data science', y='machine learning', data=df)
data:image/s3,"s3://crabby-images/99449/9944972c6c6baad365d60082304468d7052d5de9" alt=""
sns.catplot(x='categorical', y='data science', kind='violin', data=df)
data:image/s3,"s3://crabby-images/69c75/69c75e85e398d32727ceeabeaaa60cbf423b5fb8" alt=""
fig, axes = plt.subplots(1, 2, sharey=True, figsize=(8, 4))
sns.scatterplot(x="Mes", y="deep learning", hue="categorical", data=df, ax=axes[0])
axes[0].set_title('Deep Learning')
sns.scatterplot(x="Mes", y="machine learning", hue="categorical", data=df, ax=axes[1])
axes[1].set_title('Machine Learning')
data:image/s3,"s3://crabby-images/701b4/701b493ac1de075d5316feac2e46511049e7ffbd" alt=""
5. Bokeh
from bokeh.plotting import figure, output_file, save
output_file('data_science_popularity.html')
p = figure(title='data science', x_axis_label='Mes', y_axis_label='data science')
p.line(df['Mes'], df['data science'], legend='popularity', line_width=2)
save(p)
data:image/s3,"s3://crabby-images/373e7/373e7239055fd504c573be6f46c44e6f1b96dc05" alt=""
output_file('multiple_graphs.html')
s1 = figure(width=250, plot_height=250, title='data science')
s1.circle(df['Mes'], df['data science'], size=10, color='navy', alpha=0.5)
s2 = figure(width=250, height=250, x_range=s1.x_range, y_range=s1.y_range, title='machine learning') #share both axis range
s2.triangle(df['Mes'], df['machine learning'], size=10, color='red', alpha=0.5)
s3 = figure(width=250, height=250, x_range=s1.x_range, title='deep learning') #share only one axis range
s3.square(df['Mes'], df['deep learning'], size=5, color='green', alpha=0.5)
p = gridplot([[s1, s2, s3]])
save(p)
data:image/s3,"s3://crabby-images/91923/919232a7afe32fa24c5ac4161cb2379b1d20df74" alt=""
6. altair
7. folium
import folium
m1 = folium.Map(location=[41.38, 2.17], tiles='openstreetmap', zoom_start=18)
m1.save('map1.html')
data:image/s3,"s3://crabby-images/53534/53534a7f04848f6705c4923833e9f4a94a83a7ae" alt=""
m2 = folium.Map(location=[41.38, 2.17], tiles='openstreetmap', zoom_start=16)
folium.Marker([41.38, 2.176], popup='You can use whatever HTML code you want', tooltip='click here').add_to(m2)
folium.Marker([41.38, 2.174], popup='You can use whatever HTML code you want', tooltip='dont click here').add_to(m2)
m2.save('map2.html')
data:image/s3,"s3://crabby-images/f5494/f54949c8f858e7eb34326f6eaf16a1cb2e0efd1c" alt=""
from geopandas.tools import geocode
df2 = pd.read_csv('mapa.csv')
df2.dropna(axis=0, inplace=True)
df2['geometry'] = geocode(df2['País'], provider='nominatim')['geometry'] #It may take a while because it downloads a lot of data.
df2['Latitude'] = df2['geometry'].apply(lambda l: l.y)
df2['Longitude'] = df2['geometry'].apply(lambda l: l.x)
data:image/s3,"s3://crabby-images/2a6d3/2a6d3f52f79c1ca5327946853525fed4ab3d32e0" alt=""
m3 = folium.Map(location=[39.326234,-4.838065], tiles='openstreetmap', zoom_start=3)
def color_producer(val):
if val <= 50:
return 'red'
else:
return 'green'
for i in range(0,len(df2)):
folium.Circle(location=[df2.iloc[i]['Latitud'], df2.iloc[i]['Longitud']], radius=5000*df2.iloc[i]['data science'], color=color_producer(df2.iloc[i]['data science'])).add_to(m3)
m3.save('map3.html')
data:image/s3,"s3://crabby-images/8c4a6/8c4a637b71d9e00d49b256f6cfc47186237e6f56" alt=""
推荐阅读
评论