find_bug.scala 24.9 KB
Newer Older
王志伟's avatar
王志伟 committed
1 2 3 4
package com.gmei

import java.io.Serializable

王志伟's avatar
王志伟 committed
5
import com.gmei.WeafareStat.{defaultParams, parser}
王志伟's avatar
王志伟 committed
6
import org.apache.spark.sql.{SaveMode}
王志伟's avatar
王志伟 committed
7
//import org.apache.spark.sql.{SaveMode}
王志伟's avatar
王志伟 committed
8 9
import org.apache.log4j.{Level, Logger}
import scopt.OptionParser
王志伟's avatar
王志伟 committed
10
import com.gmei.lib.AbstractParams
王志伟's avatar
王志伟 committed
11

王志伟's avatar
王志伟 committed
12
object find_bug {
王志伟's avatar
王志伟 committed
13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46

  Logger.getLogger("org.apache.spark").setLevel(Level.WARN)
  Logger.getLogger("org.apache.eclipse.jetty.server").setLevel(Level.OFF)

  case class Params(env: String = "dev",
                    date: String = "2018-08-01"
                   ) extends AbstractParams[Params] with Serializable

  val defaultParams = Params()

  val parser = new OptionParser[Params]("Feed_EDA") {
    head("WeafareStat")
    opt[String]("env")
      .text(s"the databases environment you used")
      .action((x, c) => c.copy(env = x))
    opt[String] ("date")
      .text(s"the date you used")
      .action((x,c) => c.copy(date = x))
    note(
      """
        |For example, the following command runs this app on a tidb dataset:
        |
        | spark-submit --class com.gmei.WeafareStat ./target/scala-2.11/feededa-assembly-0.1.jar \
      """.stripMargin +
        s"|   --env ${defaultParams.env}"
    )
  }

  def main(args: Array[String]): Unit = {
    parser.parse(args, defaultParams).map { param =>
      GmeiConfig.setup(param.env)
      val spark_env = GmeiConfig.getSparkSession()
      val sc = spark_env._2

王志伟's avatar
王志伟 committed
47 48 49 50 51 52 53
//      val ti = new TiContext(sc)
      sc.sql("use jerry_prod")
//      ti.tidbMapTable(dbName = "jerry_prod", tableName = "diary_video")
//      ti.tidbMapTable(dbName = "jerry_prod", tableName = "data_feed_click")
//      ti.tidbMapTable(dbName = "jerry_prod", tableName = "blacklist")
//      ti.tidbMapTable(dbName = "jerry_prod", tableName = "data_feed_exposure")
//      ti.tidbMapTable(dbName = "jerry_prod", tableName = "merge_queue_table")
王志伟's avatar
王志伟 committed
54 55


王志伟's avatar
王志伟 committed
56 57
      val stat_date = GmeiConfig.getMinusNDate(1)
//      val stat_date = param.date
王志伟's avatar
王志伟 committed
58
      println(stat_date)
王志伟's avatar
王志伟 committed
59
      val partition_date = stat_date.replace("-","")
王志伟's avatar
王志伟 committed
60 61 62 63 64 65 66 67 68 69 70
      val decive_id_oldUser = sc.sql(
        s"""
           |select distinct(device_id) as device_id
           |from online.ml_device_day_active_status
           |where active_type = '4'
           |and first_channel_source_type not in ('yqxiu1','yqxiu2','yqxiu3','yqxiu4','yqxiu5','mxyc1','mxyc2','mxyc3'
           |    ,'wanpu','jinshan','jx','maimai','zhuoyi','huatian','suopingjingling','mocha','mizhe','meika','lamabang'
           |    ,'js-az1','js-az2','js-az3','js-az4','js-az5','jfq-az1','jfq-az2','jfq-az3','jfq-az4','jfq-az5','toufang1'
           |    ,'toufang2','toufang3','toufang4','toufang5','toufang6','TF-toufang1','TF-toufang2','TF-toufang3','TF-toufang4'
           |    ,'TF-toufang5','tf-toufang1','tf-toufang2','tf-toufang3','tf-toufang4','tf-toufang5','benzhan','promotion_aso100'
           |    ,'promotion_qianka','promotion_xiaoyu','promotion_dianru','promotion_malioaso','promotion_malioaso-shequ'
王志伟's avatar
王志伟 committed
71
           |    ,'promotion_shike','promotion_julang_jl03','','unknown','promotion_zuimei')
王志伟's avatar
王志伟 committed
72 73 74
           |and partition_date ='${partition_date}'
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
75
      decive_id_oldUser.show()
王志伟's avatar
王志伟 committed
76 77 78 79 80 81
      decive_id_oldUser.createOrReplaceTempView("device_id_old")


      val clk_count_oldUser_Contrast = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as clk_count_oldUser_Contrast
王志伟's avatar
王志伟 committed
82
           |from jerry_prod.data_feed_click jd inner join device_id_old
王志伟's avatar
王志伟 committed
83 84 85 86 87 88 89
           |on jd.device_id = device_id_old.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
           |and jd.device_id regexp'1$$'
           |and jd.device_id not in (select device_id from blacklist)
           |and jd.stat_date ='${stat_date}'
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
90 91
      clk_count_oldUser_Contrast.show()

王志伟's avatar
王志伟 committed
92

王志伟's avatar
王志伟 committed
93
      val imp_count_oldUser_Contrast = sc.sql(
王志伟's avatar
王志伟 committed
94
        s"""
王志伟's avatar
王志伟 committed
95
           |select '${stat_date}' as stat_date, count(cid_id) as imp_count_oldUser_Contrast
王志伟's avatar
王志伟 committed
96
           |from jerry_prod.data_feed_exposure je inner join device_id_old
王志伟's avatar
王志伟 committed
97 98 99 100 101
           |on je.device_id = device_id_old.device_id
           |where je.cid_type = 'diary'
           |and je.device_id regexp'1$$'
           |and je.device_id not in (select device_id from blacklist)
           |and je.stat_date ='${stat_date}'
王志伟's avatar
王志伟 committed
102 103
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
104 105
      imp_count_oldUser_Contrast.show()

王志伟's avatar
王志伟 committed
106

王志伟's avatar
王志伟 committed
107
      val clk_count_oldUser_all = sc.sql(
王志伟's avatar
王志伟 committed
108
        s"""
王志伟's avatar
王志伟 committed
109
           |select '${stat_date}' as stat_date, count(cid_id) as clk_count_oldUser_all
王志伟's avatar
王志伟 committed
110
           |from jerry_prod.data_feed_click jd inner join device_id_old
王志伟's avatar
王志伟 committed
111 112 113 114 115 116
           |on jd.device_id = device_id_old.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
           |and jd.device_id not in (select device_id from blacklist)
           |and jd.stat_date ='${stat_date}'
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
117
      clk_count_oldUser_all.show()
王志伟's avatar
王志伟 committed
118 119 120 121

      val imp_count_oldUser_all = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as imp_count_oldUser_all
王志伟's avatar
王志伟 committed
122
           |from jerry_prod.data_feed_exposure je inner join device_id_old
王志伟's avatar
王志伟 committed
123 124 125 126
           |on je.device_id = device_id_old.device_id
           |where je.cid_type = 'diary'
           |and je.device_id not in (select device_id from blacklist)
           |and je.stat_date ='${stat_date}'
王志伟's avatar
王志伟 committed
127 128
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
129
      imp_count_oldUser_all.show()
王志伟's avatar
王志伟 committed
130 131


王志伟's avatar
王志伟 committed
132 133 134
      val result1 = clk_count_oldUser_Contrast.join(imp_count_oldUser_Contrast,"stat_date")
        .join(clk_count_oldUser_all,"stat_date")
        .join(imp_count_oldUser_all,"stat_date")
王志伟's avatar
王志伟 committed
135 136
      result1.show()

王志伟's avatar
王志伟 committed
137
//      GmeiConfig.writeToJDBCTable(result1, "bug_Recommendation_strategy_temp", SaveMode.Append)
王志伟's avatar
王志伟 committed
138 139 140
//      GmeiConfig.writeToJDBCTable("jdbc:mysql://152.136.44.138:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true",result1, table="bug_Recommendation_strategy_temp",SaveMode.Append)

      println("开始写入")
王志伟's avatar
王志伟 committed
141 142
//      GmeiConfig.writeToJDBCTable("jerry.jdbcuri",result1, table="bug_Recommendation_strategy_temp",SaveMode.Append)
      GmeiConfig.writeToJDBCTable("jdbc:mysql://172.16.40.158:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true",result1, table="bug_Recommendation_strategy_temp",SaveMode.Append)
王志伟's avatar
王志伟 committed
143 144
      println("写入完成")

王志伟's avatar
王志伟 committed
145

王志伟's avatar
王志伟 committed
146 147


王志伟's avatar
王志伟 committed
148 149 150 151
      //device_id尾号1有点击用户日记本点击数
      val clk_active_1 = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(jd.cid_id) as clk_active_1
王志伟's avatar
王志伟 committed
152
           |from jerry_prod.data_feed_click jd inner join device_id_old
王志伟's avatar
王志伟 committed
153 154 155 156 157 158 159
           |on jd.device_id = device_id_old.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
           |and jd.device_id regexp'1$$'
           |and jd.device_id not in (select device_id from blacklist)
           |and jd.stat_date ='${stat_date}'
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
160
      clk_active_1.show()
王志伟's avatar
王志伟 committed
161 162 163 164 165

      //device_id尾号1有点击用户日记本曝光数
      val imp_active_1 = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(je.cid_id) as imp_active_1
王志伟's avatar
王志伟 committed
166
           |from jerry_prod.data_feed_exposure je inner join device_id_old
王志伟's avatar
王志伟 committed
167 168 169 170 171 172 173
           |on je.device_id = device_id_old.device_id
           |where je.cid_type = 'diary'
           |and je.device_id in (select distinct(device_id) from data_feed_click where device_id regexp '1$$' and stat_date = '${stat_date}')
           |and je.device_id not in (select device_id from blacklist)
           |and je.stat_date ='${stat_date}'
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
174
      imp_active_1.show()
王志伟's avatar
王志伟 committed
175 176 177 178 179

      //device_id尾号1点击日记本用户数
      val clk_diary_device = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(distinct(jd.device_id)) as clk_diary_device
王志伟's avatar
王志伟 committed
180
           |from jerry_prod.data_feed_click jd inner join device_id_old
王志伟's avatar
王志伟 committed
181 182 183 184 185 186 187
           |on jd.device_id = device_id_old.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
           |and jd.device_id regexp'1$$'
           |and jd.device_id not in (select device_id from blacklist)
           |and jd.stat_date ='${stat_date}'
            """.stripMargin
      )
王志伟's avatar
王志伟 committed
188
      clk_diary_device.show()
王志伟's avatar
王志伟 committed
189 190 191 192 193

      //所有有点击用户日记本点击数
      val clk_active_all = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(jd.cid_id) as clk_active_all
王志伟's avatar
王志伟 committed
194
           |from jerry_prod.data_feed_click jd inner join device_id_old
王志伟's avatar
王志伟 committed
195 196 197 198 199 200
           |on jd.device_id = device_id_old.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
           |and jd.device_id not in (select device_id from blacklist)
           |and jd.stat_date ='${stat_date}'
          """.stripMargin
      )
王志伟's avatar
王志伟 committed
201
      clk_active_all.show()
王志伟's avatar
王志伟 committed
202 203 204 205 206

      //所有有点击用户日记本曝光数
      val imp_active_all = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(je.cid_id) as imp_active_all
王志伟's avatar
王志伟 committed
207
           |from jerry_prod.data_feed_exposure je inner join device_id_old
王志伟's avatar
王志伟 committed
208 209 210 211 212 213 214
           |on je.device_id = device_id_old.device_id
           |where je.cid_type = 'diary'
           |and je.device_id in (select distinct(device_id) from data_feed_click where stat_date = '${stat_date}')
           |and je.device_id not in (select device_id from blacklist)
           |and je.stat_date ='${stat_date}'
          """.stripMargin
      )
王志伟's avatar
王志伟 committed
215
      imp_active_all.show()
王志伟's avatar
王志伟 committed
216 217 218 219 220

      //策略命中用户点击日记本用户数
      val clk_diary_device_cover = sc.sql(
        s"""
           |select '${stat_date}' as stat_date,count(distinct(device_id)) as clk_diary_device_cover
王志伟's avatar
王志伟 committed
221
           |from jerry_prod.merge_queue_table
王志伟's avatar
王志伟 committed
222 223 224
           |where device_id in (select distinct(device_id) from data_feed_click where stat_date = '${stat_date}')
          """.stripMargin
      )
王志伟's avatar
王志伟 committed
225
      clk_diary_device_cover.show()
王志伟's avatar
王志伟 committed
226 227 228 229 230

      //策略命中用户总数
      val device_all_cover = sc.sql(
        s"""
           |select '${stat_date}' as stat_date,count(distinct(device_id)) as device_all_cover
王志伟's avatar
王志伟 committed
231
           |from jerry_prod.merge_queue_table
王志伟's avatar
王志伟 committed
232 233
          """.stripMargin
      )
王志伟's avatar
王志伟 committed
234 235
      device_all_cover.show()

王志伟's avatar
王志伟 committed
236 237 238 239 240 241 242 243 244

      val result2 = clk_active_1.join(imp_active_1,"stat_date")
        .join(clk_active_all,"stat_date")
        .join(imp_active_all,"stat_date")
        .join(clk_diary_device,"stat_date")
        .join(clk_diary_device_cover,"stat_date")
        .join(device_all_cover,"stat_date")
      result2.show()

王志伟's avatar
王志伟 committed
245 246
//      GmeiConfig.writeToJDBCTable(result2, "bug_strategy_other", SaveMode.Append)
      println("开始写入")
王志伟's avatar
王志伟 committed
247 248 249
//      GmeiConfig.writeToJDBCTable("jerry.jdbcuri",result2, table="bug_strategy_other",SaveMode.Append)
//      println("写入完成")
      GmeiConfig.writeToJDBCTable("jdbc:mysql://172.16.40.158:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true",result2, table="bug_strategy_other",SaveMode.Append)
王志伟's avatar
王志伟 committed
250
      println("写入完成")
王志伟's avatar
王志伟 committed
251 252 253 254 255 256 257


      //统计新用户点击率
      val devicee_id_newUser = sc.sql(
        s"""
           |select distinct(device_id) as device_id
           |from online.ml_device_day_active_status
王志伟's avatar
王志伟 committed
258
           |where (active_type = '1' or active_type = '2')
王志伟's avatar
王志伟 committed
259 260 261 262 263 264
           |and first_channel_source_type not in ('yqxiu1','yqxiu2','yqxiu3','yqxiu4','yqxiu5','mxyc1','mxyc2','mxyc3'
           |    ,'wanpu','jinshan','jx','maimai','zhuoyi','huatian','suopingjingling','mocha','mizhe','meika','lamabang'
           |    ,'js-az1','js-az2','js-az3','js-az4','js-az5','jfq-az1','jfq-az2','jfq-az3','jfq-az4','jfq-az5','toufang1'
           |    ,'toufang2','toufang3','toufang4','toufang5','toufang6','TF-toufang1','TF-toufang2','TF-toufang3','TF-toufang4'
           |    ,'TF-toufang5','tf-toufang1','tf-toufang2','tf-toufang3','tf-toufang4','tf-toufang5','benzhan','promotion_aso100'
           |    ,'promotion_qianka','promotion_xiaoyu','promotion_dianru','promotion_malioaso','promotion_malioaso-shequ'
王志伟's avatar
王志伟 committed
265
           |    ,'promotion_shike','promotion_julang_jl03','','unknown','promotion_zuimei')
王志伟's avatar
王志伟 committed
266 267 268 269 270 271 272 273 274
           |and partition_date ='${partition_date}'
         """.stripMargin
      )
      devicee_id_newUser.show()
      devicee_id_newUser.createOrReplaceTempView("device_id_new")

      val clk_count_newUser_Contrast = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as clk_count_newUser_Contrast
王志伟's avatar
王志伟 committed
275
           |from jerry_prod.data_feed_click jd inner join device_id_new
王志伟's avatar
王志伟 committed
276 277 278
           |on jd.device_id = device_id_new.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
           |and jd.device_id regexp'1$$'
王志伟's avatar
王志伟 committed
279
           |and jd.device_id not in (select device_id from jerry_prod.blacklist)
王志伟's avatar
王志伟 committed
280 281 282
           |and jd.stat_date ='${stat_date}'
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
283
      clk_count_newUser_Contrast.show()
王志伟's avatar
王志伟 committed
284 285 286 287

      val imp_count_newUser_Contrast = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as imp_count_newUser_Contrast
王志伟's avatar
王志伟 committed
288
           |from jerry_prod.data_feed_exposure je inner join device_id_new
王志伟's avatar
王志伟 committed
289 290 291 292 293 294 295
           |on je.device_id = device_id_new.device_id
           |where je.cid_type = 'diary'
           |and je.device_id regexp'1$$'
           |and je.device_id not in (select device_id from blacklist)
           |and je.stat_date ='${stat_date}'
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
296
      imp_count_newUser_Contrast.show()
王志伟's avatar
王志伟 committed
297 298 299 300

      val clk_count_newUser_all = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as clk_count_newUser_all
王志伟's avatar
王志伟 committed
301
           |from jerry_prod.data_feed_click jd inner join device_id_new
王志伟's avatar
王志伟 committed
302 303
           |on jd.device_id = device_id_new.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
王志伟's avatar
王志伟 committed
304
           |and jd.device_id not in (select device_id from jerry_prod.blacklist)
王志伟's avatar
王志伟 committed
305 306 307
           |and jd.stat_date ='${stat_date}'
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
308
      clk_count_newUser_all.show()
王志伟's avatar
王志伟 committed
309 310 311 312

      val imp_count_newUser_all = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as imp_count_newUser_all
王志伟's avatar
王志伟 committed
313
           |from jerry_prod.data_feed_exposure je inner join device_id_new
王志伟's avatar
王志伟 committed
314 315
           |on je.device_id = device_id_new.device_id
           |where je.cid_type = 'diary'
王志伟's avatar
王志伟 committed
316
           |and je.device_id not in (select device_id from jerry_prod.blacklist)
王志伟's avatar
王志伟 committed
317 318 319
           |and je.stat_date ='${stat_date}'
         """.stripMargin
      )
王志伟's avatar
王志伟 committed
320
      imp_count_newUser_all.show()
王志伟's avatar
王志伟 committed
321 322 323 324 325 326

      val result3 = clk_count_newUser_Contrast.join(imp_count_newUser_Contrast,"stat_date")
        .join(clk_count_newUser_all,"stat_date")
        .join(imp_count_newUser_all,"stat_date")
      result3.show()

王志伟's avatar
王志伟 committed
327
//      GmeiConfig.writeToJDBCTable(result3, "bug_Recommendation_strategy_newUser", SaveMode.Append)
王志伟's avatar
王志伟 committed
328 329 330
//      GmeiConfig.writeToJDBCTable("jdbc:mysql://152.136.44.138:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true",result3, table="bug_Recommendation_strategy_newUser",SaveMode.Append)

      println("开始写入")
王志伟's avatar
王志伟 committed
331 332 333
//      GmeiConfig.writeToJDBCTable("jerry.jdbcuri",result3, table="bug_Recommendation_strategy_newUser",SaveMode.Append)
//      println("写入完成")
      GmeiConfig.writeToJDBCTable("jdbc:mysql://172.16.40.158:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true",result3, table="bug_Recommendation_strategy_newUser",SaveMode.Append)
王志伟's avatar
王志伟 committed
334
      println("写入完成")
王志伟's avatar
王志伟 committed
335

王志伟's avatar
王志伟 committed
336

王志伟's avatar
王志伟 committed
337 338 339 340 341
    }


  }

王志伟's avatar
王志伟 committed
342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382
}





object CTR_precise {

  Logger.getLogger("org.apache.spark").setLevel(Level.WARN)
  Logger.getLogger("org.apache.eclipse.jetty.server").setLevel(Level.OFF)

  case class Params(env: String = "dev",
                    date: String = "2018-08-01"
                   ) extends AbstractParams[Params] with Serializable

  val defaultParams = Params()

  val parser = new OptionParser[Params]("Feed_EDA") {
    head("WeafareStat")
    opt[String]("env")
      .text(s"the databases environment you used")
      .action((x, c) => c.copy(env = x))
    opt[String] ("date")
      .text(s"the date you used")
      .action((x,c) => c.copy(date = x))
    note(
      """
        |For example, the following command runs this app on a tidb dataset:
        |
        | spark-submit --class com.gmei.WeafareStat ./target/scala-2.11/feededa-assembly-0.1.jar \
      """.stripMargin +
        s"|   --env ${defaultParams.env}"
    )
  }

  def main(args: Array[String]): Unit = {
    parser.parse(args, defaultParams).map { param =>
      GmeiConfig.setup(param.env)
      val spark_env = GmeiConfig.getSparkSession()
      val sc = spark_env._2

王志伟's avatar
王志伟 committed
383 384 385 386 387 388 389
//      val ti = new TiContext(sc)
      sc.sql("use jerry_prod")
//      ti.tidbMapTable(dbName = "jerry_prod", tableName = "data_feed_exposure_precise")
//      ti.tidbMapTable(dbName = "jerry_prod", tableName = "data_feed_click")
//      ti.tidbMapTable(dbName = "jerry_prod", tableName = "blacklist")
//      ti.tidbMapTable(dbName = "jerry_prod", tableName = "data_feed_exposure")
//      ti.tidbMapTable(dbName = "jerry_prod", tableName = "merge_queue_table")
王志伟's avatar
王志伟 committed
390 391


王志伟's avatar
王志伟 committed
392 393
      val stat_date = GmeiConfig.getMinusNDate(1)
//      val stat_date = param.date
王志伟's avatar
王志伟 committed
394 395 396 397 398 399 400 401 402 403 404 405 406
      //println(param.date)
      val partition_date = stat_date.replace("-","")
      val decive_id_oldUser = sc.sql(
        s"""
           |select distinct(device_id) as device_id
           |from online.ml_device_day_active_status
           |where active_type = '4'
           |and first_channel_source_type not in ('yqxiu1','yqxiu2','yqxiu3','yqxiu4','yqxiu5','mxyc1','mxyc2','mxyc3'
           |    ,'wanpu','jinshan','jx','maimai','zhuoyi','huatian','suopingjingling','mocha','mizhe','meika','lamabang'
           |    ,'js-az1','js-az2','js-az3','js-az4','js-az5','jfq-az1','jfq-az2','jfq-az3','jfq-az4','jfq-az5','toufang1'
           |    ,'toufang2','toufang3','toufang4','toufang5','toufang6','TF-toufang1','TF-toufang2','TF-toufang3','TF-toufang4'
           |    ,'TF-toufang5','tf-toufang1','tf-toufang2','tf-toufang3','tf-toufang4','tf-toufang5','benzhan','promotion_aso100'
           |    ,'promotion_qianka','promotion_xiaoyu','promotion_dianru','promotion_malioaso','promotion_malioaso-shequ'
王志伟's avatar
王志伟 committed
407
           |    ,'promotion_shike','promotion_julang_jl03','','unknown','promotion_zuimei')
王志伟's avatar
王志伟 committed
408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465
           |and partition_date ='${partition_date}'
         """.stripMargin
      )
      decive_id_oldUser.createOrReplaceTempView("device_id_old")


      val clk_count_oldUser_Contrast = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as clk_count_oldUser_Contrast
           |from data_feed_click jd inner join device_id_old
           |on jd.device_id = device_id_old.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
           |and jd.device_id regexp'1$$'
           |and jd.device_id not in (select device_id from blacklist)
           |and jd.stat_date ='${stat_date}'
         """.stripMargin
      )

      val imp_count_oldUser_Contrast = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as imp_count_oldUser_Contrast
           |from data_feed_exposure_precise je inner join device_id_old
           |on je.device_id = device_id_old.device_id
           |where je.cid_type = 'diary'
           |and je.device_id regexp'1$$'
           |and je.device_id not in (select device_id from blacklist)
           |and je.stat_date ='${stat_date}'
         """.stripMargin
      )

      val clk_count_oldUser_all = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as clk_count_oldUser_all
           |from data_feed_click jd inner join device_id_old
           |on jd.device_id = device_id_old.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
           |and jd.device_id not in (select device_id from blacklist)
           |and jd.stat_date ='${stat_date}'
         """.stripMargin
      )

      val imp_count_oldUser_all = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as imp_count_oldUser_all
           |from data_feed_exposure_precise je inner join device_id_old
           |on je.device_id = device_id_old.device_id
           |where je.cid_type = 'diary'
           |and je.device_id not in (select device_id from blacklist)
           |and je.stat_date ='${stat_date}'
         """.stripMargin
      )


      val result1 = clk_count_oldUser_Contrast.join(imp_count_oldUser_Contrast,"stat_date")
        .join(clk_count_oldUser_all,"stat_date")
        .join(imp_count_oldUser_all,"stat_date")
      result1.show()

王志伟's avatar
王志伟 committed
466 467 468
//      GmeiConfig.writeToJDBCTable("jdbc:mysql://152.136.44.138:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true",result1, table="bug_precise_Recommendation_strategy_temp",SaveMode.Append)

      println("开始写入")
王志伟's avatar
王志伟 committed
469 470 471 472
//      GmeiConfig.writeToJDBCTable("jerry.jdbcuri",result1, table="bug_precise_Recommendation_strategy_temp",SaveMode.Append)
//      println("写入完成")

      GmeiConfig.writeToJDBCTable("jdbc:mysql://172.16.40.158:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true",result1, table="bug_precise_Recommendation_strategy_temp",SaveMode.Append)
王志伟's avatar
王志伟 committed
473
      println("写入完成")
王志伟's avatar
王志伟 committed
474

王志伟's avatar
王志伟 committed
475
//      GmeiConfig.writeToJDBCTable(result1, "bug_precise_Recommendation_strategy_temp", SaveMode.Append)
王志伟's avatar
王志伟 committed
476 477 478 479 480 481

      //统计新用户点击率
      val devicee_id_newUser = sc.sql(
        s"""
           |select distinct(device_id) as device_id
           |from online.ml_device_day_active_status
王志伟's avatar
王志伟 committed
482
           |where (active_type = '1' or active_type = '2')
王志伟's avatar
王志伟 committed
483 484 485 486 487 488
           |and first_channel_source_type not in ('yqxiu1','yqxiu2','yqxiu3','yqxiu4','yqxiu5','mxyc1','mxyc2','mxyc3'
           |    ,'wanpu','jinshan','jx','maimai','zhuoyi','huatian','suopingjingling','mocha','mizhe','meika','lamabang'
           |    ,'js-az1','js-az2','js-az3','js-az4','js-az5','jfq-az1','jfq-az2','jfq-az3','jfq-az4','jfq-az5','toufang1'
           |    ,'toufang2','toufang3','toufang4','toufang5','toufang6','TF-toufang1','TF-toufang2','TF-toufang3','TF-toufang4'
           |    ,'TF-toufang5','tf-toufang1','tf-toufang2','tf-toufang3','tf-toufang4','tf-toufang5','benzhan','promotion_aso100'
           |    ,'promotion_qianka','promotion_xiaoyu','promotion_dianru','promotion_malioaso','promotion_malioaso-shequ'
王志伟's avatar
王志伟 committed
489
           |    ,'promotion_shike','promotion_julang_jl03','','unknown','promotion_zuimei')
王志伟's avatar
王志伟 committed
490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546
           |and partition_date ='${partition_date}'
         """.stripMargin
      )
      devicee_id_newUser.show()
      devicee_id_newUser.createOrReplaceTempView("device_id_new")

      val clk_count_newUser_Contrast = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as clk_count_newUser_Contrast
           |from data_feed_click jd inner join device_id_new
           |on jd.device_id = device_id_new.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
           |and jd.device_id regexp'1$$'
           |and jd.device_id not in (select device_id from blacklist)
           |and jd.stat_date ='${stat_date}'
         """.stripMargin
      )

      val imp_count_newUser_Contrast = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as imp_count_newUser_Contrast
           |from data_feed_exposure_precise je inner join device_id_new
           |on je.device_id = device_id_new.device_id
           |where je.cid_type = 'diary'
           |and je.device_id regexp'1$$'
           |and je.device_id not in (select device_id from blacklist)
           |and je.stat_date ='${stat_date}'
         """.stripMargin
      )

      val clk_count_newUser_all = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as clk_count_newUser_all
           |from data_feed_click jd inner join device_id_new
           |on jd.device_id = device_id_new.device_id
           |where  (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
           |and jd.device_id not in (select device_id from blacklist)
           |and jd.stat_date ='${stat_date}'
         """.stripMargin
      )

      val imp_count_newUser_all = sc.sql(
        s"""
           |select '${stat_date}' as stat_date, count(cid_id) as imp_count_newUser_all
           |from data_feed_exposure_precise je inner join device_id_new
           |on je.device_id = device_id_new.device_id
           |where je.cid_type = 'diary'
           |and je.device_id not in (select device_id from blacklist)
           |and je.stat_date ='${stat_date}'
         """.stripMargin
      )

      val result3 = clk_count_newUser_Contrast.join(imp_count_newUser_Contrast,"stat_date")
        .join(clk_count_newUser_all,"stat_date")
        .join(imp_count_newUser_all,"stat_date")
      result3.show()

王志伟's avatar
王志伟 committed
547
//      GmeiConfig.writeToJDBCTable(result3, "bug_precise_Recommendation_strategy_newUser", SaveMode.Append)
王志伟's avatar
王志伟 committed
548 549 550
//      GmeiConfig.writeToJDBCTable("jdbc:mysql://152.136.44.138:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true",result3, table="bug_precise_Recommendation_strategy_newUser",SaveMode.Append)

      println("开始写入")
王志伟's avatar
王志伟 committed
551 552 553
//      GmeiConfig.writeToJDBCTable("jerry.jdbcuri",result3, table="bug_precise_Recommendation_strategy_newUser",SaveMode.Append)
//      println("写入完成")
      GmeiConfig.writeToJDBCTable("jdbc:mysql://172.16.40.158:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true",result3, table="bug_precise_Recommendation_strategy_newUser",SaveMode.Append)
王志伟's avatar
王志伟 committed
554
      println("写入完成")
王志伟's avatar
王志伟 committed
555

王志伟's avatar
王志伟 committed
556 557 558 559 560 561

    }


  }

562 563
}