# 早下班系列：比Python更称手的兵器

import pandas

# Script 1: load D:/data.txt, convert its numeric columns, and print the mean
# of every numeric column per (STYLE, BEDROOMS) group.

# Read the whole file; the context manager closes the handle even when the
# read fails (replaces the manual try/finally).
with open('D:/data.txt', 'r') as source:
    raw_text = source.read()

# One row per line, fields separated by a single space. Blank lines (such as
# the empty string left after a trailing newline) are skipped, because they
# would otherwise raise IndexError in the column clean-up below.
# NOTE(review): the separator is reproduced as it appears in the original;
# confirm the data file is space-delimited rather than tab-delimited.
rows = [line.split(" ") for line in raw_text.split("\n") if line.strip()]

# rows[0] is the header; every later row is a record.
for record in rows[1:]:
    # Column 4 may carry a dollar sign and thousands separators. They are
    # removed outright: substituting a space would leave text such as "1 234",
    # which cannot be parsed as a number. The original pattern "\$" is an
    # unrecognised escape (backslash + dollar), so it never matched a bare
    # "$"; both spellings are stripped here.
    record[4] = (
        record[4].replace("\\$", "").replace("$", "").replace(",", "")
    )

    # Columns 1-4 are numeric. Parse them explicitly instead of calling
    # eval() on file contents, which would execute arbitrary expressions.
    # Integers stay int; anything else must be a valid float.
    for column in (1, 2, 3, 4):
        try:
            record[column] = int(record[column])
        except ValueError:
            record[column] = float(record[column])

data = pandas.DataFrame(rows[1:], columns=rows[0])

# Only columns 1-4 were converted, so any other non-key column is still text.
# numeric_only=True keeps such columns out of the aggregation; with the
# pandas >= 2.0 default (False) a text column makes mean() raise TypeError.
out = data.groupby(['STYLE', 'BEDROOMS']).mean(numeric_only=True)

print(out)

import pandas

import time

# Script 2: run the same load / convert / group pipeline on D:/data2.txt and
# print the elapsed time in seconds.

# time.clock() was removed in Python 3.8; perf_counter() is the documented
# replacement for measuring elapsed time.
start = time.perf_counter()

# Read the whole file; the context manager closes the handle even when the
# read fails (replaces the manual try/finally).
with open('D:/data2.txt', 'r') as source:
    raw_text = source.read()

# One row per line, fields separated by a single space. Blank lines (such as
# the empty string left after a trailing newline) are skipped, because they
# would otherwise raise IndexError in the column clean-up below.
# NOTE(review): the separator is reproduced as it appears in the original;
# confirm the data file is space-delimited rather than tab-delimited.
rows = [line.split(" ") for line in raw_text.split("\n") if line.strip()]

# rows[0] is the header; every later row is a record.
for record in rows[1:]:
    # Column 4 may carry a dollar sign and thousands separators. They are
    # removed outright: substituting a space would leave text such as "1 234",
    # which cannot be parsed as a number. The original pattern "\$" is an
    # unrecognised escape (backslash + dollar), so it never matched a bare
    # "$"; both spellings are stripped here.
    record[4] = (
        record[4].replace("\\$", "").replace("$", "").replace(",", "")
    )

    # Columns 1-4 are numeric. Parse them explicitly instead of calling
    # eval() on file contents, which would execute arbitrary expressions.
    # Integers stay int; anything else must be a valid float.
    for column in (1, 2, 3, 4):
        try:
            record[column] = int(record[column])
        except ValueError:
            record[column] = float(record[column])

data = pandas.DataFrame(rows[1:], columns=rows[0])

# Only columns 1-4 were converted, so any other non-key column is still text.
# numeric_only=True keeps such columns out of the aggregation; with the
# pandas >= 2.0 default (False) a text column makes mean() raise TypeError.
out = data.groupby(['STYLE', 'BEDROOMS']).mean(numeric_only=True)

# Elapsed time in fractional seconds (the original used an en dash here
# instead of the minus operator, which is a syntax error).
elapsed = time.perf_counter() - start

print(elapsed)

1391毫秒约等于1.4秒（请注意此处有个小数点……）

