8000字 | Python数据可视化，完整版实操指南！
data:image/s3,"s3://crabby-images/9b0c3/9b0c37546c68465b1e25f9dac45f0d6fdc72081b" alt=""
1. 前言
data:image/s3,"s3://crabby-images/b588e/b588e632862dfd2dd044085c093309bd5e9601ff" alt=""
2. pandas
import pandas as pd
# Load the dataset from the CSV file in the working directory.
df = pd.read_csv('temporal.csv')
# Preview the first ten rows.
df.head(n=10)
data:image/s3,"s3://crabby-images/8956d/8956dabbec8ba913b7b0c9207b487c136c0af7d4" alt=""
# Show descriptive statistics for the DataFrame.
df.describe()
data:image/s3,"s3://crabby-images/8610a/8610a8af28c497ff47f0fd85442251e702b91275" alt=""
# Print a concise summary of the DataFrame (columns, dtypes, non-null counts).
df.info()
data:image/s3,"s3://crabby-images/99092/99092833d77d2442802683a26150d7b1a10a1fa5" alt=""
data:image/s3,"s3://crabby-images/bcc47/bcc4720884da7b341ce720ff0bbd5e0812c4af32" alt=""
# Raise pandas' display limits so wide or long frames are not truncated.
pd.set_option('display.max_rows', 500)
pd.set_option('display.max_columns', 500)
pd.set_option('display.width', 1000)

# First attempt: one format string per column (currency, month-year, percent).
format_dict = {
    'data science': '${0:,.2f}',
    'Mes': '{:%m-%Y}',
    'machine learning': '{:.2%}',
}
# The month column must be datetime for the '{:%m-%Y}' format to apply.
df['Mes'] = pd.to_datetime(df['Mes'])
# Render the first rows with the formats above.
df.head().style.format(format_dict)

# Reduced dictionary: keep only the format that makes sense for this data.
format_dict = {'Mes': '{:%m-%Y}'}
# Highlight the per-column maximum and minimum of the first rows.
(
    df.head()
    .style
    .format(format_dict)
    .highlight_max(color='darkgreen')
    .highlight_min(color='#ff0000')
)
data:image/s3,"s3://crabby-images/7be3c/7be3c0f83177a16c9de1c000c4826ce92814f6fe" alt=""
# Shade two of the columns with a blue-green colour gradient.
(
    df.head(10)
    .style
    .format(format_dict)
    .background_gradient(subset=['data science', 'machine learning'], cmap='BuGn')
)
data:image/s3,"s3://crabby-images/91850/9185094e4bd97ba650db0572aa440d52b599d281" alt=""
# Draw in-cell red bars for two of the columns.
(
    df.head()
    .style
    .format(format_dict)
    .bar(color='red', subset=['data science', 'deep learning'])
)
data:image/s3,"s3://crabby-images/4c0c1/4c0c19b41ad070cdc42abbf45c0215558b568132" alt=""
# Combine a colour gradient on two columns with a yellow highlight on each
# column's maximum. The method chain must use an ASCII '.'; a full-width
# period here is a syntax error.
(
    df.head(10)
    .style
    .format(format_dict)
    .background_gradient(subset=['data science', 'machine learning'], cmap='BuGn')
    .highlight_max(color='yellow')
)
data:image/s3,"s3://crabby-images/10ca7/10ca7a0a84fef44e208a46c6c2f1650d74a7ee8e" alt=""
from pandas_profiling import ProfileReport
# Build a profiling report for the whole DataFrame and write it to an HTML file.
prof = ProfileReport(df)
prof.to_file(output_file='report.html')
data:image/s3,"s3://crabby-images/f9427/f9427b44cc1285d1b4359af4a4e66e9d590f951e" alt=""
3. matplotlib
import matplotlib.pyplot as plt
plt.plot(df['Mes'], df['data science'], label='data science')
# `label` only names the series for the legend; the legend itself is not drawn until plt.legend() is called.
data:image/s3,"s3://crabby-images/e2e27/e2e2736f1be84aff7f74bd2497b75aa57e222b31" alt=""
# Plot the three series on the same axes; matplotlib assigns each call the
# next colour in its cycle. Labels match the column names exactly (no
# trailing whitespace) so a later legend reads consistently.
plt.plot(df['Mes'], df['data science'], label='data science')
plt.plot(df['Mes'], df['machine learning'], label='machine learning')
plt.plot(df['Mes'], df['deep learning'], label='deep learning')
data:image/s3,"s3://crabby-images/ea195/ea195b1a027eab37a6c593694d9691c128796591" alt=""
# Describe the figure first: title and axis captions.
plt.title('Popularity of AI terms by date')
plt.xlabel('Date')
plt.ylabel('Popularity')

# One line per search term, all sharing the date axis.
plt.plot(df['Mes'], df['data science'], label='data science')
plt.plot(df['Mes'], df['machine learning'], label='machine learning')
plt.plot(df['Mes'], df['deep learning'], label='deep learning')

# Turn on the grid and render the legend from the labels given above.
plt.grid(True)
plt.legend()
data:image/s3,"s3://crabby-images/b6aca/b6aca838e5ac3b88d6a262836b8ef532e1dc5587" alt=""
# Create a 2x2 grid of axes and draw a different chart in each cell.
fig, axes = plt.subplots(nrows=2, ncols=2)
axes[0][0].hist(df['data science'])                     # top-left: histogram
axes[0][1].scatter(df['Mes'], df['data science'])       # top-right: scatter
axes[1][0].plot(df['Mes'], df['machine learning'])      # bottom-left: line
axes[1][1].plot(df['Mes'], df['deep learning'])         # bottom-right: line
data:image/s3,"s3://crabby-images/f7b6b/f7b6b7158c41fd9921ecab782ee80974f3af6c35" alt=""
# The third positional argument is a matplotlib format string
# (colour + line style and/or marker).
plt.plot(df['Mes'], df['data science'], 'r-')        # red solid line
plt.plot(df['Mes'], df['data science'] * 2, 'bs')    # blue squares
plt.plot(df['Mes'], df['data science'] * 3, 'g ^')   # green triangles, no line
data:image/s3,"s3://crabby-images/04880/0488009c4443e5bb55145fc1e9477597ada4fa9f" alt=""
# Scatter one term's values against another's.
plt.scatter(x=df['data science'], y=df['machine learning'])
data:image/s3,"s3://crabby-images/d271f/d271fd7b1412224d3817991e10e1850e3fa39742" alt=""
# Bar chart over the date column; `width` is expressed in x-axis units.
plt.bar(x=df['Mes'], height=df['machine learning'], width=20)
data:image/s3,"s3://crabby-images/6cb85/6cb853fa7f8a37bdf4a8c8cf3c8b512f4ec12b63" alt=""
# Histogram of the 'deep learning' column split into 15 bins.
plt.hist(x=df['deep learning'], bins=15)
data:image/s3,"s3://crabby-images/19c21/19c214329f98833296a8f9bb54ac2aa85a46fa45" alt=""
# Line chart of the three terms with a free-text label and an arrow annotation.
plt.plot(df['Mes'], df['data science'], label='data science')
plt.plot(df['Mes'], df['machine learning'], label='machine learning')
plt.plot(df['Mes'], df['deep learning'], label='deep learning')
plt.xlabel('Date')
plt.ylabel('Popularity')
plt.title('Popularity of AI terms by date')
plt.grid(True)
# Text coordinates use the same units as the plotted data.
# NOTE(review): the date coordinates below are plain strings; this relies on
# the active date converter parsing strings -- confirm with the matplotlib /
# pandas versions in use.
plt.text(x='2010-01-01', y=80, s=r'$\lambda=1, r^2=0.8$')
# `xy` is the point the arrow points at; `xytext` is where the caption sits.
plt.annotate(
    'Notice something?',
    xy=('2014-01-01', 30),
    xytext=('2006-01-01', 50),
    arrowprops={'facecolor': 'red', 'shrink': 0.05},
)
data:image/s3,"s3://crabby-images/242e8/242e866b9c53206562b83f34f6ac4cd533487a31" alt=""
4. seaborn
import seaborn as sns
# Apply seaborn's default theme to subsequent plots.
sns.set()
# Pass the data vectors by keyword: recent seaborn releases no longer accept
# x and y as positional arguments.
sns.scatterplot(x=df['Mes'], y=df['data science'])
data:image/s3,"s3://crabby-images/204bc/204bc4dfb31666a9b844aa4bbdd27b48e54ed544" alt=""
# Relational plot that maps up to five columns onto position, colour,
# marker size and facet column.
sns.relplot(
    data=df,
    x='Mes',
    y='deep learning',
    hue='data science',
    size='machine learning',
    col='categorical',
)
data:image/s3,"s3://crabby-images/f998d/f998d5109148d663dadebe14f8a59f1b96250725" alt=""
# Heatmap of the column correlation matrix, with each cell annotated to two
# decimals. The format spec must start with an ASCII '.'.
sns.heatmap(df.corr(), annot=True, fmt='.2f')
data:image/s3,"s3://crabby-images/8920d/8920dcc96015cb9a19c2f74935f55c1bcbaa6b24" alt=""
# Plot pairwise relationships between the columns of df.
sns.pairplot(df)
data:image/s3,"s3://crabby-images/f2d68/f2d681a1ff7ff16fa1a1bc449d03b5a9b31c918f" alt=""
# Same pairwise grid, coloured by the 'categorical' column.
sns.pairplot(data=df, hue='categorical')
data:image/s3,"s3://crabby-images/14b86/14b865110be588403642a9caaaa7ceb3bc8f564e" alt=""
# Joint plot of two terms, with their individual distributions on the margins.
sns.jointplot(
    data=df,
    x='data science',
    y='machine learning',
)
data:image/s3,"s3://crabby-images/a809c/a809c46fab50b23a95c08a4e34dde0632cf9979d" alt=""
# Violin plot of 'data science' for each value of the 'categorical' column.
sns.catplot(
    data=df,
    x='categorical',
    y='data science',
    kind='violin',
)
data:image/s3,"s3://crabby-images/681d3/681d36f7f3a06ce8971b88c24bc1647900a02da3" alt=""
# Two seaborn scatter plots side by side on matplotlib axes sharing the y axis.
fig, axes = plt.subplots(nrows=1, ncols=2, sharey=True, figsize=(8, 4))

# Left panel.
sns.scatterplot(data=df, x='Mes', y='deep learning', hue='categorical', ax=axes[0])
axes[0].set_title('Deep Learning')

# Right panel.
sns.scatterplot(data=df, x='Mes', y='machine learning', hue='categorical', ax=axes[1])
axes[1].set_title('Machine Learning')
data:image/s3,"s3://crabby-images/56144/5614411c7665229b5482d9115bfcc1f0bea8fdf9" alt=""
5. Bokeh
from bokeh.plotting import figure, output_file, save
# Write the plot to a standalone HTML file.
output_file('data_science_popularity.html')
p = figure(title='data science', x_axis_label='Mes', y_axis_label='data science')
# `legend_label` replaces the old `legend` glyph keyword, which newer Bokeh
# releases no longer accept.
p.line(df['Mes'], df['data science'], legend_label='popularity', line_width=2)
save(p)
data:image/s3,"s3://crabby-images/95214/95214634a8e94e3c9093adcc78891eea0416cc66" alt=""
# gridplot lives in bokeh.layouts and is not imported anywhere else in this
# script, so bring it into scope here.
from bokeh.layouts import gridplot

output_file('multiple_graphs.html')

# Three small figures; use the same width/height keywords on all of them.
s1 = figure(width=250, height=250, title='data science')
s1.circle(df['Mes'], df['data science'], size=10, color='navy', alpha=0.5)

# Shares both axis ranges with s1, so pan/zoom stay in sync on x and y.
s2 = figure(width=250, height=250, x_range=s1.x_range, y_range=s1.y_range, title='machine learning')
s2.triangle(df['Mes'], df['machine learning'], size=10, color='red', alpha=0.5)

# Shares only the x range with s1.
s3 = figure(width=250, height=250, x_range=s1.x_range, title='deep learning')
s3.square(df['Mes'], df['deep learning'], size=5, color='green', alpha=0.5)

# Lay the three figures out in a single row and save the page.
p = gridplot([[s1, s2, s3]])
save(p)
data:image/s3,"s3://crabby-images/5c315/5c3152479025a92e569b8423d4fbc1d33d72f657" alt=""
6. altair
7. folium
import folium
# Basic map centred on the given [latitude, longitude], saved as HTML.
m1 = folium.Map(
    location=[41.38, 2.17],
    tiles='openstreetmap',
    zoom_start=18,
)
m1.save('map1.html')
data:image/s3,"s3://crabby-images/5d7a0/5d7a0693e02cf0754586b1d0eabcfd4c5814b4eb" alt=""
# Map with two markers; popups accept HTML and tooltips appear on hover.
m2 = folium.Map(
    location=[41.38, 2.17],
    tiles='openstreetmap',
    zoom_start=16,
)
folium.Marker(
    [41.38, 2.176],
    popup='<i>You can use whatever HTML code you want</i>',
    tooltip='click here',
).add_to(m2)
folium.Marker(
    [41.38, 2.174],
    popup='<b>You can use whatever HTML code you want</b>',
    tooltip='dont click here',
).add_to(m2)
m2.save('map2.html')
data:image/s3,"s3://crabby-images/d0048/d004855abdc48774286baf2069e641d56a8b15e0" alt=""
from geopandas.tools import geocode
# Load the per-country data and drop every row that has a missing value.
df2 = pd.read_csv('mapa.csv')
df2.dropna(axis=0, inplace=True)
# Geocode each country name through Nominatim. This can take a while
# because it downloads a lot of data.
df2['geometry'] = geocode(df2['País'], provider='nominatim')['geometry']
# Split each geocoded geometry into separate coordinate columns.
df2['Latitude'] = df2['geometry'].apply(lambda point: point.y)
df2['Longitude'] = df2['geometry'].apply(lambda point: point.x)
data:image/s3,"s3://crabby-images/6023b/6023b71eb664b3568d6e5724e2bf67254dab571e" alt=""
# Zoomed-out base map that the per-country circles are added to.
m3 = folium.Map(
    location=[39.326234, -4.838065],
    tiles='openstreetmap',
    zoom_start=3,
)
def color_producer(val):
    """Return the circle colour for a popularity value.

    Args:
        val: Numeric value to classify.

    Returns:
        'red' when ``val`` is at most 50, otherwise 'green'.
    """
    return 'red' if val <= 50 else 'green'
# Draw one circle per row of df2: the radius scales with the 'data science'
# value and the colour comes from color_producer. The coordinate columns are
# named 'Latitude' / 'Longitude', matching the names used when they are
# created from the geocoded geometry.
for _, row in df2.iterrows():
    folium.Circle(
        location=[row['Latitude'], row['Longitude']],
        radius=5000 * row['data science'],
        color=color_producer(row['data science']),
    ).add_to(m3)
m3.save('map3.html')
data:image/s3,"s3://crabby-images/c959c/c959c46e3d09fd7fee4865313c971a6d696cfcd4" alt=""
- EOF -
推荐阅读:
评论