#視覺化
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
# Draw every figure below with matplotlib's "ggplot" style sheet.
plt.style.use("ggplot")

# Load the 2012 MLB data set; the CSV file is decoded as Big5 text.
df1 = pd.read_csv(
    "2012MLB.csv",
    encoding="big5",
)
# Peek at the first rows. As a bare expression this is only displayed in an
# interactive session (e.g. a notebook cell); in a plain script it shows nothing.
df1.head()
# Histogram of the HR column, counted into explicit, unevenly spaced bins.
hr_bin_edges = [0, 10, 20, 30, 50, 100, 200, 300]
plt.hist(df1["HR"], bins=hr_bin_edges)
plt.show()
# Bar chart of the HR column, one bar per row of the table.
# plt.bar needs exactly one x position per bar height, so the positions
# (1, 2, 3, ...) are generated from the length of the column rather than typed
# out by hand; a fixed-length list stops matching as soon as the CSV has a
# different number of rows.
y = df1['HR']
x = list(range(1, len(y) + 1))
plt.bar(x, y, align='center')
plt.show()
# Scatter plot: H on the horizontal axis against HR on the vertical axis.
plt.scatter(
    x=df1["H"],
    y=df1["HR"],
    color="blue",
)
plt.show()
# Box plot of the H column.
# showfliers controls whether outlier points are drawn; True includes them.
draw_outliers = True
plt.boxplot(df1["H"], showfliers=draw_outliers)
plt.show()
# Pie chart of HR for the rows labelled 0 through 5 (.loc slices include both
# end labels), with each wedge labelled by the matching Team value.
first_rows = df1.loc[0:5, ["Team", "HR"]]
plt.pie(first_rows["HR"], labels=first_rows["Team"])
plt.show()
# Advanced examples
# Line chart: two series (R and RBI) drawn on the same axes, both plotted
# against the H values of the rows labelled 0 through 5.
df1  # bare expression; displays the table only in an interactive session
subset = df1.loc[0:5, ["H", "R", "RBI"]]
for column in ("R", "RBI"):
    plt.plot(subset["H"], subset[column], "-")
plt.show()
# Plot styles
# List every available style: print(plt.style.available)
# Apply a style: plt.style.use('style name')
# Title and axis labels
# Use the SimHei (Hei typeface) font family; presumably chosen so that the
# Chinese x-axis label below can be rendered.
plt.rcParams['font.family'] = 'SimHei'

# Same HR histogram as before, now in blue with a title and labelled axes.
plt.hist(df1['HR'], bins=[0, 10, 20, 30, 50, 100, 200, 300], color='blue')
plt.title('MLB2012')
plt.xlabel('分箱')
plt.ylabel('HR')
plt.show()
# Two plots stacked in one figure, sharing the same x axis.
y = df1.loc[0:5, 'HR']
# One x position per selected row, derived from the data so the positions and
# the values cannot fall out of sync if the slice above is changed.
x = list(range(1, len(y) + 1))

# Top panel (2 rows, 1 column, slot 1): dashed blue line.
ax1 = plt.subplot(211)
plt.plot(x, y, color='blue', linestyle='--')
plt.xlabel('分箱')
plt.ylabel('HR')
# Hide the top panel's x tick labels.
plt.setp(ax1.get_xticklabels(), visible=False)

# Bottom panel (slot 2): bar chart that shares the top panel's x axis.
plt.subplot(212, sharex=ax1)
plt.bar(x, y, align='center')
plt.xlabel('分箱')
plt.ylabel('HR')
plt.show()
#Pandas 視覺化
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
# Font family first (SimHei, a Hei typeface), then the ggplot style sheet.
plt.rcParams["font.family"] = "SimHei"
plt.style.use("ggplot")

# Reload the 2012 MLB data set from the Big5-encoded CSV file.
df1 = pd.read_csv(
    "2012MLB.csv",
    encoding="big5",
)
df1  # bare expression; displays the table only in an interactive session

# Working frame for the pandas plots: rows labelled 0 through 5 and only the
# Team, H and HR columns.
wanted_columns = ["Team", "H", "HR"]
df2 = df1.loc[0:5, wanted_columns]
# Bar chart: HR for each Team.
df2.plot.bar(x="Team", y="HR", title="長條圖", color="blue")
plt.show()

# Area chart of the frame; no x/y columns are specified here.
df2.plot.area(title="面積圖")
plt.show()

# Hexagonal-bin plot of H against HR with gridsize=10.
df2.plot.hexbin(x="H", y="HR", gridsize=10, title="蜂窩圖")
plt.show()

# Scatter plot of H against HR.
df2.plot.scatter(x="H", y="HR", title="散布圖")
plt.show()
# Several plots on one set of axes: the hexbin call returns the axes it drew
# on, and the scatter plot is then drawn onto those same axes via ax=.
shared_axes = df2.plot.hexbin(x="H", y="HR", gridsize=10, title="蜂窩圖")
df2.plot.scatter(x="H", y="HR", title="散布圖", ax=shared_axes)
plt.show()
# 留言列表 ("comment list") - leftover web-page footer text, not part of the script