Commit 5493b3f5 authored by 郭羽

美购精排模型

parent 094d9856
......@@ -188,5 +188,6 @@ if __name__ == '__main__':
predict(model_file,df_test)
pass
......@@ -212,7 +212,7 @@ def getDataVocab(samples):
for c in samples.columns:
# 判断是否以Bucket结尾 和 类别特征
if c.endswith("Bucket") or c in ITEM_CATE_COLUMNS:
if c.endswith("Bucket") or c in ITEM_CATE_COLUMNS+["userid","itemid"]:
datas = samples.select(c).distinct().collect()
vocabSet = set()
for d in datas:
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment