import pandas as pd
# Load the housing dataset from CSV into a DataFrame.
# NOTE(review): this is an absolute path on the author's Windows desktop, so
# the cell only runs as-is on that machine — adjust the path before re-running.
data = pd.read_csv("C:/Users/admin/Desktop/beikezhaofang.csv")
# Preview the first rows to check the column names and sample values.
data.head()
|   | price | unitprice | region | build_year | house_type | house_Size | elevator | floor_type |
|---|---|---|---|---|---|---|---|---|
| 0 | 280.0 | 51150.9 | dongcheng | 1990 | 2室1厅 | 54.74 | 0 | 地下室 |
| 1 | 395.0 | 68839.3 | dongcheng | 1981 | 2室1厅 | 57.38 | 0 | 中楼层 |
| 2 | 450.0 | 58631.9 | dongcheng | 2010 | 1室0厅 | 76.75 | 1 | 中楼层 |
| 3 | 467.0 | 67446.6 | dongcheng | 2005 | 1室1厅 | 69.24 | 1 | 高楼层 |
| 4 | 1050.0 | 105189.0 | dongcheng | 2006 | 2室1厅 | 99.82 | 1 | 高楼层 |
# Count how many rows fall under each distinct "region" value
# (at this point the values are still pinyin district identifiers).
data["region"].value_counts()
xicheng 1499
chaoyang 1498
shijingshan 1494
fengtai 1489
dongcheng 1488
changping 1486
haidian 1486
tongzhou 1485
daxing 1478
shunyi 1467
fangshan 1444
mentougou 1143
yizhuangkaifaqu 1052
pinggu 48
miyun 28
huairou 16
yanqing 7
Name: region, dtype: int64
# Translate the pinyin district identifiers in the "region" column into their
# Chinese names, then re-count the rows per district to verify the result.
#
# Keeping the translation in one dict makes each pair easy to audit. The
# previous copy-pasted assignments mapped "miyun" to "顺义" (Shunyi), which
# silently merged the 28 Miyun rows into Shunyi; it now maps to "密云".
# NOTE: any recorded output from before this fix (顺义 1495, no 密云 row) is
# stale — re-run the cell to refresh it.
REGION_NAMES_ZH = {
    "xicheng": "西城",
    "chaoyang": "朝阳",
    "shijingshan": "石景山",
    "fengtai": "丰台",
    "dongcheng": "东城",
    "haidian": "海淀",
    "changping": "昌平",
    "tongzhou": "通州",
    "daxing": "大兴",
    "shunyi": "顺义",
    "fangshan": "房山",
    "mentougou": "门头沟",
    "yizhuangkaifaqu": "亦庄",
    "pinggu": "平谷",
    "miyun": "密云",
    "huairou": "怀柔",
    "yanqing": "延庆",
}
# Exact-match value replacement; values that are not keys of the dict are left
# unchanged, just as with the original per-value .loc assignments.
data["region"] = data["region"].replace(REGION_NAMES_ZH)
data["region"].value_counts()
西城 1499
朝阳 1498
顺义 1495
石景山 1494
丰台 1489
东城 1488
昌平 1486
海淀 1486
通州 1485
大兴 1478
房山 1444
门头沟 1143
亦庄 1052
平谷 48
怀柔 16
延庆 7
Name: region, dtype: int64
# Save the DataFrame (with the translated region names) to data1.csv, resolved
# relative to the current working directory; index=False keeps the row index
# out of the file.
data.to_csv('data1.csv', index=False)
# Preview the first rows again to confirm the "region" column now holds the
# Chinese names.
data.head()
|   | price | unitprice | region | build_year | house_type | house_Size | elevator | floor_type |
|---|---|---|---|---|---|---|---|---|
| 0 | 280.0 | 51150.9 | 东城 | 1990 | 2室1厅 | 54.74 | 0 | 地下室 |
| 1 | 395.0 | 68839.3 | 东城 | 1981 | 2室1厅 | 57.38 | 0 | 中楼层 |
| 2 | 450.0 | 58631.9 | 东城 | 2010 | 1室0厅 | 76.75 | 1 | 中楼层 |
| 3 | 467.0 | 67446.6 | 东城 | 2005 | 1室1厅 | 69.24 | 1 | 高楼层 |
| 4 | 1050.0 | 105189.0 | 东城 | 2006 | 2室1厅 | 99.82 | 1 | 高楼层 |