Commit dddaef01 authored by 张彦钊

change test file

parent ef64e1b8
......@@ -198,25 +198,28 @@ def con_sql(db,sql):
def test():
# sql = "select stat_date,cid_id from esmm_train_data e where stat_date = '{}' limit 60".format("2019-04-25")
# df = spark.createDataFrame(spark.sql(sql).rdd.map(lambda x:(x[0],x[1])).zipWithIndex()
# .map(lambda x:(x[1],x[0][0],x[0][1]))).toDF("ind","k","v")
# df.show(6)
# # df.write.csv('/recommend/tr', mode='overwrite', header=True)
# df = df.toPandas()
from hdfs import InsecureClient
from hdfs.ext.dataframe import read_dataframe
from hdfs.ext.dataframe import write_dataframe
sql = "select stat_date,cid_id from esmm_train_data e where stat_date = '{}' limit 60".format("2019-04-25")
df = spark.createDataFrame(spark.sql(sql).rdd.map(lambda x:(x[0],x[1])).zipWithIndex()
.map(lambda x:(x[1],x[0][0],x[0][1]))).toDF("ind","k","v")
df.show(6)
df.write.csv('/recommend/tr', mode='overwrite', header=True)
df.write.format("avro").mode("overwrite").save("/recommend/tr/avro.csv")
client = InsecureClient('http://nvwa01:50070')
# write_dataframe(client, '/recommend/va/a.csv', df)
df = read_dataframe(client,"/recommend/va/a.csv")
print(df.head())
#
# from hdfs import InsecureClient
# from hdfs.ext.dataframe import read_dataframe
# from hdfs.ext.dataframe import write_dataframe
#
#
# client = InsecureClient('http://nvwa01:50070')
# # write_dataframe(client, '/recommend/va/a.csv', df)
#
# df = read_dataframe(client,"/recommend/va/a.csv")
#
#
# print(df.head())
# spark.sql("use online")
# spark.sql("ADD JAR /srv/apps/brickhouse-0.7.1-SNAPSHOT.jar")
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment