Commit 57567111 authored by 张彦钊

change test file

parent 23fd48e1
...@@ -34,7 +34,8 @@ def multi_hot(df,column,n): ...@@ -34,7 +34,8 @@ def multi_hot(df,column,n):
def feature_engineer(): def feature_engineer():
# TODO 删除下面的测试写入 # TODO 删除下面的测试写入
df = spark.sql("select y,z from esmm_train_data limit 60") df = spark.sql("select y,z from esmm_train_data limit 60")
df.write.format("avro").save(path=path + "tr", mode="overwrite") df.write.format("com.databricks.spark.avro").save(path=path + "tr", mode="overwrite")
print("done")
db = pymysql.connect(host='172.16.40.158', port=4000, user='root', passwd='3SYz54LS9#^9sBvC', db='jerry_test') db = pymysql.connect(host='172.16.40.158', port=4000, user='root', passwd='3SYz54LS9#^9sBvC', db='jerry_test')
sql = "select max(stat_date) from esmm_train_data" sql = "select max(stat_date) from esmm_train_data"
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment