Commit a483e2b0 authored by 王志伟

新统计需求

parent 5780f800
...@@ -9,6 +9,7 @@ import scopt.OptionParser ...@@ -9,6 +9,7 @@ import scopt.OptionParser
import com.gmei.lib.AbstractParams import com.gmei.lib.AbstractParams
//import org.apache.hadoop.hive.ql.exec.spark.session.SparkSession //import org.apache.hadoop.hive.ql.exec.spark.session.SparkSession
import org.apache.spark.sql.SparkSession import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.functions._
object strategy_other { object strategy_other {
...@@ -259,7 +260,7 @@ object diary_exposure { ...@@ -259,7 +260,7 @@ object diary_exposure {
val final_cid_city = diary_id_temp.join(df_cid_city,Seq("diary_id"),"left_outer").na.drop() val final_cid_city = diary_id_temp.join(df_cid_city,Seq("diary_id"),"left_outer").na.drop()
final_cid_city.show() final_cid_city.show()
final_cid_city.groupBy("name").count().show(30) final_cid_city.groupBy("name").count().orderBy(desc("count"))
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment