import csv
# Read the data: load every row of the CSV (header row included) into `data`.
# The path is a raw string so the Windows backslashes are taken literally
# instead of being parsed as (invalid) escape sequences. The `with` block
# guarantees the file is closed; the original wrote `f.close` without calling it.
# newline="" is what the csv module asks for so that newlines embedded in
# quoted fields are handled correctly.
with open(r"C:\ProgramData\Anaconda3\Scripts\white_wine.csv", "r", newline="") as f:
    data = list(csv.reader(f))

# Preview the first five rows; slicing also copes with files shorter than that.
for row in data[:5]:
    print(row)
# 2. Process the data: group the rows by quality level.
# `content_dict` maps each quality value (the last column, parsed as int)
# to the list of rows carrying that value. data[0] is skipped as the header.
content_dict = {}
for row in data[1:]:
    quality = int(row[-1])
    # setdefault creates the empty group the first time a quality value is seen.
    content_dict.setdefault(quality, []).append(row)

# Report how many rows fell into each quality level.
for key, rows in content_dict.items():
    print(key, ":", len(rows))
# 2) Count the number of rows in each quality level.
# The grouping is rebuilt from `data` here so this step does not depend on
# any earlier state: quality (last column, as int) -> list of rows.
content_dict = {}
for row in data[1:]:  # data[0] is the header row
    quality = int(row[-1])
    content_dict.setdefault(quality, []).append(row)

# One line per quality level: "<quality> : <row count>".
for key, rows in content_dict.items():
    print(key, ":", len(rows))
# 3) Compute the mean fixed acidity of each quality group.
# `mean_list` collects (quality, mean) pairs; the mean is taken over the
# first column of the group's rows, parsed as float.
mean_list = []
for key, value in content_dict.items():
    # Use the builtin sum() rather than an accumulator named `sum`, which
    # would shadow the builtin for the rest of the script.
    total = sum(float(row[0]) for row in value)
    mean_list.append((key, total / len(value)))

# One line per group: "<quality> : <mean>".
for key, mean in mean_list:
    print(key, ":", mean)
4、思考题
计算每个数据集中fixed acidity低于均值的数目。
通过遍历来统计,代码可这样写:
# Pull the mean out of each (quality, mean) pair, keeping mean_list's order.
means = [pair[-1] for pair in mean_list]

# Walk the groups and their means in lockstep. This assumes mean_list was
# built by iterating content_dict, so both sequences share the same order.
for (quality, rows), mean in zip(content_dict.items(), means):
    # Each comparison yields a bool; summing them counts the rows whose
    # first-column value is strictly below the group's mean.
    below = sum(float(row[0]) < mean for row in rows)
    print(quality, below)
如对你有帮助,请点击采纳按钮。
您好,我是有问必答小助手,您的问题已经有小伙伴帮您解答,感谢您对有问必答的支持与关注!