Commit c5885ec2 authored by 王志伟

统计多天重复日记数量,增加过滤个人黑名单

parent 37a31760
...@@ -320,8 +320,8 @@ object Repeated_content_recommendation_moreday { ...@@ -320,8 +320,8 @@ object Repeated_content_recommendation_moreday {
|from data_feed_exposure_precise |from data_feed_exposure_precise
|where cid_type = 'diary' |where cid_type = 'diary'
|and stat_date >='${date}' |and stat_date >='${date}'
|group by device_id,stat_date
|and device_id not in (select device_id from blacklist) |and device_id not in (select device_id from blacklist)
|group by device_id,stat_date
""".stripMargin """.stripMargin
).rdd.map(row=>(row(0).toString,row(1).toString,row(2).toString)).map(row=>(row._2,row._3)).groupByKey() ).rdd.map(row=>(row(0).toString,row(1).toString,row(2).toString)).map(row=>(row._2,row._3)).groupByKey()
.filter(x => x._2.size >1) .filter(x => x._2.size >1)
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment