Pandas章節所使用的數據可以從以下連結下載: https://files.cnblogs.com/files/AI-robort/Titanic_Data-master.zip
import pandas as pd
# Toy frame: three keys ('A', 'B', 'C'), each appearing three times,
# paired with an integer 'data' column.
df = pd.DataFrame({
    'key': ['A', 'B', 'C', 'A', 'B', 'C', 'A', 'B', 'C'],
    'data': [0, 5, 10, 5, 10, 15, 10, 15, 20],
})
df

# Manual "group by": select the rows for each key and sum them.
# NOTE: .sum() runs over the whole filtered frame, so the 'key' column is
# reduced along with 'data'.
for key in ['A', 'B', 'C']:
    print(key, df[df['key'] == key].sum())

# The same per-key grouping and sum, done in a single call by groupby.
df.groupby('key').sum()
import numpy as np
# aggregate() applies a reduction (e.g. 'sum', 'mean') to every group.
# The string alias is used instead of np.mean: passing the NumPy callable
# to a groupby aggregation is deprecated in recent pandas releases and
# emits a FutureWarning, while 'mean' yields the same per-key averages.
df.groupby('key').aggregate('mean')
# Load the Titanic training set from the extracted archive
# (path is relative to the current working directory).
df1 = pd.read_csv(
    './Titanic_Data-master/Titanic_Data-master/train.csv'
)

# Mean of the 'Age' column for each value of 'Sex'.
df1['Age'].groupby(df1['Sex']).mean()

# Mean of the 'Survived' column for each value of 'Sex'
# (reads as a survival rate if 'Survived' is a 0/1 flag).
df1['Survived'].groupby(df1['Sex']).mean()