diff --git a/diary-training.py b/diary-training.py index 1fef962271e7bc1fb0f65814ac9ade092fcd8046..05212196368b7245810ba20adda0524293efd6c3 100644 --- a/diary-training.py +++ b/diary-training.py @@ -4,6 +4,8 @@ import pandas as pd from sklearn.utils import shuffle import numpy as np import xlearn as xl + + # 从数据库的表里获取数据，并转化成df格式 def con_sql(sql): db = pymysql.connect(host='10.66.157.22', port=4000, user='root', passwd='3SYz54LS9#^9sBvC', db='jerry_test') @@ -14,6 +16,7 @@ def con_sql(sql): db.close() return df + # 获取点击表里的device_id sql = "select distinct device_id from data_feed_click" click_device_id = con_sql(sql)[0].values.tolist() @@ -161,9 +164,9 @@ ffm_model.setTrain("/home/zhangyanzhao/data.csv") # ffm_model.setValidate("/home/zhangyanzhao/validation.csv") param = {'task':'binary', 'lr':0.05, - 'lambda':0.002, 'metric':'auc'} + 'lambda':0.002, 'metric':'auc', 'fold':3} -ffm_model.fit(param, '/home/zhangyanzhao/model.out') +ffm_model.cv(param, '/home/zhangyanzhao/model.out') ''' ffm_model.setTest("/home/zhangyanzhao/test.csv")