Commit a0be2abc authored by 郭羽

美购精排模型

parent e3a53854
...@@ -39,18 +39,18 @@ def getDataVocabFromRedis(version): ...@@ -39,18 +39,18 @@ def getDataVocabFromRedis(version):
return dataVocab return dataVocab
# 数据类型转换 # 数据类型转换
def csvTypeConvert(df,data_vocab): def csvTypeConvert(columns,df,data_vocab):
# 离散na值填充 for k in columns:
for k, v in data_vocab.items(): # 离散na值填充
df[k] = df[k].fillna("-1") if k in data_vocab.items():
df[k] = df[k].astype("string") df[k] = df[k].astype("string")
df[k] = df[k].fillna("-1")
for k in ITEM_NUMBER_COLUMNS: else:
df[k] = df[k].fillna(0.0) df[k] = df[k].astype("float")
df[k] = df[k].astype("float") df[k] = df[k].fillna(0.0)
df["label"] = df["label"].astype("int") df["label"] = df["label"].astype("int")
print(df.dtypes) # print(df.dtypes)
return df return df
def loadData(data_path): def loadData(data_path):
...@@ -166,8 +166,8 @@ if __name__ == '__main__': ...@@ -166,8 +166,8 @@ if __name__ == '__main__':
print("trainSize:{},testSize{}".format(trainSize,testSize)) print("trainSize:{},testSize{}".format(trainSize,testSize))
# 数据类型转换 # 数据类型转换
df_train = csvTypeConvert(df_train,data_vocab) df_train = csvTypeConvert(datasColumns,df_train,data_vocab)
df_test = csvTypeConvert(df_test,data_vocab) df_test = csvTypeConvert(datasColumns,df_test,data_vocab)
# 获取训练数据 # 获取训练数据
train_data = getDataSet(df_train,shuffleSize=trainSize,) train_data = getDataSet(df_train,shuffleSize=trainSize,)
......
Markdown is supported
0% Try again or attach a new file
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment