Commit 5493b3f5 authored by 郭羽

美购精排模型

parent 094d9856
...@@ -188,5 +188,6 @@ if __name__ == '__main__': ...@@ -188,5 +188,6 @@ if __name__ == '__main__':
predict(model_file,df_test) predict(model_file,df_test)
pass pass
...@@ -212,7 +212,7 @@ def getDataVocab(samples): ...@@ -212,7 +212,7 @@ def getDataVocab(samples):
for c in samples.columns: for c in samples.columns:
# 判断是否以Bucket结尾 和 类别特征 # 判断是否以Bucket结尾 和 类别特征
if c.endswith("Bucket") or c in ITEM_CATE_COLUMNS: if c.endswith("Bucket") or c in ITEM_CATE_COLUMNS+["userid","itemid"]:
datas = samples.select(c).distinct().collect() datas = samples.select(c).distinct().collect()
vocabSet = set() vocabSet = set()
for d in datas: for d in datas:
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment