1. Home
  2. Docs
  3. Python
  4. Pandas
  5. 均一化

均一化（Min-Max 正規化）

# Load the first sheet of the workbook, min-max scale the selected feature
# columns and the target column, then split the result into train/test arrays.
df = pd.read_excel('桃園全區實價登錄資料_20190430修改後_轉數字_lite.xls', sheet_name=0)

# Replace every missing cell with -1 so that no NaN reaches the arithmetic
# below. Note that these -1 placeholders take part in the min/max computation.
df = df.fillna(-1)

# Quick look at the loaded data.
print(df.head())
print(df.columns)
print(df.index)

# Feature columns (X) and the target column (Y).
columnsName = ['鄉鎮市區_Code', '交易標的_Code', '土地區段位置建物區段門牌_Code']
dfX = df[columnsName]
dfY = df["總價元"]

# Min-max normalization: (value - min) / (max - min), computed per column.
# A column whose values are all identical has max == min and yields NaN.
dfX = (dfX - dfX.min()) / (dfX.max() - dfX.min())

# Same scaling for the target. The original referenced an undefined name
# `dfY2` here, which raised NameError; the series' own min/max are used.
dfY = (dfY - dfY.min()) / (dfY.max() - dfY.min())

X = dfX.to_numpy()
Y = dfY.to_numpy()
# test_size=0.01 is passed through unchanged.
# NOTE(review): presumably sklearn's train_test_split, where a float
# test_size is the held-out fraction - confirm against the file's imports.
X_train, X_test, Y_train, Y_test = train_test_split(X, Y, test_size=0.01)