引き続きUdemyでPython for Time Series Data Analysisで、特にDataの可視化方法を学習する。便利で高機能なライブラリが利用でき、pandasからすぐにplotが可能。
Dataの整形
import pandas as pd pop = pd.read_csv('./UDEMY_TSA_FINAL/Data/population_by_county.csv') pop.head() pop.columns pop['State'].unique() pop['State'].unique() pop['County'].value_counts().head() pop.sort_values('2010Census',ascending=False).head() pop.groupby('State').sum().sort_values('2010Census',ascending=False).head() sum(pop['2010Census']>1000000) def check_county(name): return "County" not in name myser = pop['County'].apply(lambda name: "County" not in name) myser.value_counts() pop['PercentChange'] = 100*(pop['2017PopEstimate'] - pop['2010Census'])/(pop['2010Census']) pop.head() states = pop.groupby('State').sum() states['PercentChange'] = 100*(states['2017PopEstimate'] - states['2010Census'])/states['2010Census'] states.sort_values('PercentChange',ascending=False).head()
data:image/s3,"s3://crabby-images/1e5ea/1e5ead25b0d8cfc19542cd25e9af74fd18c020f0" alt=""
ヒストグラムのプロット例
import pandas as pd df1 = pd.read_csv('./UDEMY_TSA_FINAL/03-Pandas-Visualization/df1.csv',index_col=0) df1.head() df2 = pd.read_csv('./UDEMY_TSA_FINAL/03-Pandas-Visualization/df2.csv') df2 df1['A'].plot.hist()
data:image/s3,"s3://crabby-images/408c6/408c6c819621d35121417d93a47c8f58fb7d0f41" alt=""
df1['A'].plot.hist(bins=80,edgecolor='k').autoscale(enable=True,axis='both',tight=True)
data:image/s3,"s3://crabby-images/a38b3/a38b3b67c739b0acde2b3b715011011e03942b41" alt=""
f1['A'].plot.hist(grid=True)
data:image/s3,"s3://crabby-images/1fa24/1fa24456655172f281d5151412e8488972ff2ad0" alt=""
ラインプロットの例
df2.plot.line(y=['a','b','c'],figsize=(10,4),lw=4)
data:image/s3,"s3://crabby-images/23d39/23d39f7a6f1e19d44e5e3915119ac315a96ffcc9" alt=""
散布図の例
df1.plot.scatter(x='A',y='B')
data:image/s3,"s3://crabby-images/a9a91/a9a914eee2c2f15cce50d0b09bccf5c342297708" alt=""
df1.plot.scatter(x='A',y='B',c='D',cmap='coolwarm')
data:image/s3,"s3://crabby-images/1d4f8/1d4f8dafc53cbb23537f23872f8ebbe81aecc857" alt=""
df1.plot.scatter(x=’A’,y=’B’,c=’D’,s=df1[‘C’]*50,alpha=0.3)
data:image/s3,"s3://crabby-images/91b1b/91b1b3e4244d540851ea5708ae442933bb0db96d" alt=""
ボックスプロットの例
df2.plot.box()
data:image/s3,"s3://crabby-images/f6ead/f6ead2a2c22f9cc0203455566bd0f2f8c3ac5ec1" alt=""
密度分布プロットの例
df2.plot.kde()
data:image/s3,"s3://crabby-images/8d8ce/8d8ce58f93512c55cfc40ae8ad704e4a671c44f2" alt=""
import numpy as np df = pd.DataFrame(np.random.randn(1000,2),columns=['a','b']) df.plot.scatter(x='a',y='b')
data:image/s3,"s3://crabby-images/6415d/6415de1a986e19a22efa0c415584b536e66aa8aa" alt=""
data:image/s3,"s3://crabby-images/4d387/4d3874d8c2d009b7e34244ec3ae0e8028a0f8e6c" alt=""
様々なプロットの設定変更
df2['c'].plot.line(figsize=(10,3),ls=':',c='red',lw=5)
data:image/s3,"s3://crabby-images/75bc4/75bc460c843b59e6344e95b8c381f4c0cd9e0d59" alt=""
title = "MY PLOT TITLE" xlabel = 'My X Data' ylabel = 'My Y Data' ax = df2['c'].plot.line(figsize=(10,3),ls=':',c='red',lw=5,title=title) ax.set(xlabel=xlabel,ylabel=ylabel)
data:image/s3,"s3://crabby-images/eec01/eec01820b3ed30142e62b5429a8533ead687982f" alt=""
ax = df2.plot() ax.legend(loc=0,bbox_to_anchor=(1.0,1.0))
data:image/s3,"s3://crabby-images/92b66/92b665e89b5090c10423cdd21d3176bc1a0731e3" alt=""
import pandas as pd df3 = pd.read_csv('./UDEMY_TSA_FINAL/03-Pandas-Visualization/df3.csv') print(len(df3)) print(df3.head()) df3.plot.scatter(x='produced',y='defective',c='red',figsize=(12,3),s=3)
data:image/s3,"s3://crabby-images/994db/994dbca8be27ef17e3412106a2448f8bbe5cc5c9" alt=""
df3['produced'].plot.hist() df3['produced'].plot.hist(edgecolor='k').autoscale(axis='x',tight=True)
data:image/s3,"s3://crabby-images/57806/578063c2c10d3de18acb4b67f1826ec6b364bc56" alt=""
df3[['weekday','produced']].boxplot(by='weekday',figsize=(12,10))
data:image/s3,"s3://crabby-images/2fd5b/2fd5ba48720dbb819dd83045ce86ebd51d6fbf43" alt=""
df3['defective'].plot.kde(ls='--',lw=5)
data:image/s3,"s3://crabby-images/b953d/b953d47c0967e5491808749d2d4ea4a927caeb8d" alt=""
df3.loc[0:30].plot.area(stacked=False,alpha=0.4) ax.legend(loc=0,bbox_to_anchor=(1.3,0.5))
data:image/s3,"s3://crabby-images/90d1e/90d1e8eed3d7ee4dfe76747783b1cf1a169d33ca" alt=""