diff --git a/task/spark_test.py b/task/spark_test.py index 2ff61bf18b889272188b8797e57b5619e9d76528..fb47382d1167396d29619a0c0fceba9b7dd1ed4c 100644 --- a/task/spark_test.py +++ b/task/spark_test.py @@ -155,7 +155,7 @@ huidu_device_id_df = spark.sql(huidu_device_id_sql) huidu_device_id_df.createOrReplaceTempView("dev_view") sql_search_ctr = r""" SELECT - count(1) + count(distinct (a.cl_id)) FROM (select device_id from dev_view) t1 left join ( @@ -178,7 +178,7 @@ sql_search_ctr = r""" transaction_type, card_id, app_session_id - )a on t1.device_id = a.cl_id group by a.device_id + )a on t1.device_id = a.cl_id """.format(today_str='20200926') print(sql_search_ctr)