import numpy as np
import pandas as pd

# Location of the tab-separated data set loaded below.
url = 'https://raw.githubusercontent.com/justmarkham/DAT8/master/data/chipotle.tsv'

# The source is a .tsv file, so the tab separator is passed explicitly.
chipo = pd.read_csv(url, sep='\t')

# Raise the display width so printed frames are less likely to be wrapped.
pd.set_option('display.width', 1000)

# First ten rows of the data set.
print(chipo.head(10))

# DataFrame.info() writes its summary to stdout itself and returns None;
# wrapping it in print() would emit an extra "None" line.
chipo.info()

# Number of columns, then the column labels and the row index.
print(chipo.shape[1])
print(chipo.columns)
print(chipo.index)
# Most frequent item name together with its row count
# (value_counts() sorts by count, descending, by default).
item_counts = chipo['item_name'].value_counts()
print(item_counts.head(1))

# Number of distinct item names.
print(chipo['item_name'].nunique())

# Most frequent choice description together with its row count.
description_counts = chipo['choice_description'].value_counts()
print(description_counts.head(1))

# Sum of the quantity column.
print(chipo['quantity'].sum())
def dollarizer(x):
    """Convert a price string such as ``'$2.39 '`` to a float.

    Surrounding whitespace and a leading ``$`` are removed before parsing.
    The previous implementation sliced ``x[1:-1]``, which silently dropped
    the last digit whenever the string had no one-character suffix.

    Args:
        x: Price text with an optional leading dollar sign.

    Returns:
        The numeric price as a ``float``.

    Raises:
        ValueError: If the remaining text is not a valid number.
    """
    return float(x.strip().lstrip('$'))


# Replace the textual prices with floats. Bracket assignment is used so the
# column is always updated (attribute assignment can create a plain Python
# attribute instead when the name is not already a column).
# NOTE(review): assumes item_price still holds strings at this point.
chipo['item_price'] = chipo['item_price'].apply(dollarizer)
print(chipo['item_price'])

# Sum of the converted item_price column.
print(chipo['item_price'].sum())
# Number of distinct order ids.
print(chipo['order_id'].nunique())

# Per-order totals of the numeric columns. numeric_only=True keeps the text
# columns out of the aggregation; pandas 2.0+ no longer drops them silently,
# so summing/averaging the whole frame is not reliable.
# NOTE(review): assumes item_price was already converted to a numeric dtype
# earlier in the script.
order_grouped = chipo.groupby('order_id').sum(numeric_only=True)

# Mean of the per-order item_price totals.
avgsum = order_grouped['item_price'].mean()
print(avgsum)

# The same figure as a single chain, restricted to the one column needed.
print(chipo.groupby('order_id')['item_price'].sum().mean())

# Number of distinct item names.
print(chipo['item_name'].nunique())
# 本文由 所长 创作，采用知识共享署名 4.0 国际许可协议进行许可。
# 本站文章除注明转载/出处外，均为本站原创或翻译，转载前请务必署名。
# 最后编辑时间为：Apr 21, 2018 at 10:22 am