Commit bfa8847f authored by 郭羽

排序模型优化

parent 75815fee
...@@ -315,7 +315,7 @@ def addUserFeatures(samples,dataVocab,multiVocab): ...@@ -315,7 +315,7 @@ def addUserFeatures(samples,dataVocab,multiVocab):
return samples return samples
def addSampleLabel(ratingSamples): def addSampleLabel(ratingSamples):
ratingSamples = ratingSamples.withColumn('label', when(F.col('rating') >= 5, 1).otherwise(0)) ratingSamples = ratingSamples.withColumn('label', when(F.col('rating') >= 1, 1).otherwise(0))
ratingSamples.show(5, truncate=False) ratingSamples.show(5, truncate=False)
ratingSamples.printSchema() ratingSamples.printSchema()
return ratingSamples return ratingSamples
...@@ -852,8 +852,8 @@ if __name__ == '__main__': ...@@ -852,8 +852,8 @@ if __name__ == '__main__':
df = ratingSamplesWithLabel.toPandas() df = ratingSamplesWithLabel.toPandas()
df = pd.DataFrame(df) df = pd.DataFrame(df)
posCount = df.loc[df["label"]==0]["label"].count() posCount = df.loc[df["label"]==1]["label"].count()
negCount = df.loc[df["label"]==1]["label"].count() negCount = df.loc[df["label"]==0]["label"].count()
print("pos size:"+str(posCount),"neg size:"+str(negCount)) print("pos size:"+str(posCount),"neg size:"+str(negCount))
itemDF = get_service_feature_df() itemDF = get_service_feature_df()
......
This diff is collapsed.
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment