Pandas 章节用到的数据可以从以下链接下载: https://files.cnblogs.com/files/AI-robort/Titanic_Data-master.zip
import pandas as pd
# Toy frame: the keys A, B and C each appear three times with a numeric value.
df = pd.DataFrame({
    'key': ['A', 'B', 'C', 'A', 'B', 'C', 'A', 'B', 'C'],
    'data': [0, 5, 10, 5, 10, 15, 10, 15, 20],
})
df  # bare expression: presumably a notebook cell display; a no-op in a script

# Manual grouping: select the rows for each key and sum them.
# Note that .sum() here also "sums" (concatenates) the string 'key' column.
for key in ['A', 'B', 'C']:
    print(key, df[df['key'] == key].sum())

# groupby produces the same per-key totals of 'data' in a single call.
df.groupby('key').sum()
import numpy as np
# aggregate applies a reduction (e.g. 'sum', 'mean') to every group.
# The string name is used instead of the NumPy callable: passing np.mean to
# a groupby aggregate is deprecated in recent pandas, and the string keeps
# the built-in groupby mean.
df.groupby('key').aggregate('mean')
# Load the Titanic training set; the path is relative to the working directory.
df1 = pd.read_csv('./Titanic_Data-master/Titanic_Data-master/train.csv')

# Build the per-sex grouping once and reuse it for both statistics.
by_sex = df1.groupby('Sex')
by_sex['Age'].mean()  # mean age for each sex
by_sex['Survived'].mean()  # mean of Survived for each sex (average survival rate)