import pandas as pd
# Load the listings CSV into a DataFrame and preview its first five rows.
csv_path = "C:/Users/admin/Desktop/beikezhaofang.csv"
data = pd.read_csv(filepath_or_buffer=csv_path)
data.head(n=5)
|
price |
unitprice |
region |
build_year |
house_type |
house_Size |
elevator |
floor_type |
0 |
280.0 |
51150.9 |
dongcheng |
1990 |
2室1廳 |
54.74 |
0 |
地下室 |
1 |
395.0 |
68839.3 |
dongcheng |
1981 |
2室1廳 |
57.38 |
0 |
中樓層 |
2 |
450.0 |
58631.9 |
dongcheng |
2010 |
1室0廳 |
76.75 |
1 |
中樓層 |
3 |
467.0 |
67446.6 |
dongcheng |
2005 |
1室1廳 |
69.24 |
1 |
高樓層 |
4 |
1050.0 |
105189.0 |
dongcheng |
2006 |
2室1廳 |
99.82 |
1 |
高樓層 |
# Count how many rows carry each (still pinyin) region label.
region_column = data["region"]
region_column.value_counts()
xicheng 1499
chaoyang 1498
shijingshan 1494
fengtai 1489
dongcheng 1488
changping 1486
haidian 1486
tongzhou 1485
daxing 1478
shunyi 1467
fangshan 1444
mentougou 1143
yizhuangkaifaqu 1052
pinggu 48
miyun 28
huairou 16
yanqing 7
Name: region, dtype: int64
# Translate the pinyin district labels in the "region" column to their
# Chinese names. A single lookup table replaces one .loc assignment per
# district, so every mapping is visible (and checkable) in one place.
# Labels that do not appear in the table are left unchanged.
REGION_NAMES = {
    "xicheng": "西城",
    "chaoyang": "朝陽",
    "shijingshan": "石景山",
    "fengtai": "豐臺",
    "dongcheng": "東城",
    "haidian": "海淀",
    "changping": "昌平",
    "tongzhou": "通州",
    "daxing": "大興",
    "shunyi": "順義",
    "fangshan": "房山",
    "mentougou": "門頭溝",
    "yizhuangkaifaqu": "亦莊",
    "pinggu": "平谷",
    # Fix: "miyun" was previously mapped to "順義" (Shunyi), which silently
    # merged the 28 Miyun rows into Shunyi (1467 -> 1495) and left no Miyun
    # category in the data.
    "miyun": "密雲",
    "huairou": "懷柔",
    "yanqing": "延慶",
}

# Exact-match replacement of whole cell values (no regex, no substrings).
data["region"] = data["region"].replace(REGION_NAMES)

# Re-count to confirm every district kept its own row total after renaming.
data["region"].value_counts()
西城 1499
朝陽 1498
順義 1495
石景山 1494
豐臺 1489
東城 1488
昌平 1486
海淀 1486
通州 1485
大興 1478
房山 1444
門頭溝 1143
亦莊 1052
平谷 48
懷柔 16
延慶 7
Name: region, dtype: int64
# Write the relabelled table to data1.csv without the index column, then
# preview the first five rows of the in-memory frame.
data.to_csv(path_or_buf="data1.csv", index=False)
data.head(n=5)
|
price |
unitprice |
region |
build_year |
house_type |
house_Size |
elevator |
floor_type |
0 |
280.0 |
51150.9 |
東城 |
1990 |
2室1廳 |
54.74 |
0 |
地下室 |
1 |
395.0 |
68839.3 |
東城 |
1981 |
2室1廳 |
57.38 |
0 |
中樓層 |
2 |
450.0 |
58631.9 |
東城 |
2010 |
1室0廳 |
76.75 |
1 |
中樓層 |
3 |
467.0 |
67446.6 |
東城 |
2005 |
1室1廳 |
69.24 |
1 |
高樓層 |
4 |
1050.0 |
105189.0 |
東城 |
2006 |
2室1廳 |
99.82 |
1 |
高樓層 |