Commit ec20028a authored by 高雅喆

update

parent 7575e6c5
......@@ -141,7 +141,15 @@ if __name__ == '__main__':
device_ids_lst_rdd = spark.sparkContext.parallelize(device_ids_lst)
gm_kv_cli = redis.Redis(host="172.16.40.135", port=5379, db=6, socket_timeout=2000)
result = device_ids_lst_rdd.repartition(100).map(lambda x: get_user_tag_score(x, all_log_df)).toDF()
result.show()
result = device_ids_lst_rdd.repartition(100).map(lambda x: get_user_tag_score(x, all_log_df)).toDF("cl_id","tag_list")
stat_date = datetime.datetime.today().strftime('%Y-%m-%d')
result_last = result.withColumn("stat_date", lit(stat_date))
result_last.show()
result_last.write.format("jdbc").options(
url='jdbc:mysql://172.16.40.158/jerry_test',
driver='com.mysql.jdbc.Driver',
dbtable='user_portrait_tags',
user='root',
password='3SYz54LS9#^9sBvC').mode('overwrite').save()
except Exception as e:
print(e)
\ No newline at end of file
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment