Commit 965afc8e authored by litaolemo's avatar litaolemo

update

parent b0e50fdb
...@@ -28,9 +28,10 @@ from pyspark.sql.functions import lit ...@@ -28,9 +28,10 @@ from pyspark.sql.functions import lit
import pytispark.pytispark as pti import pytispark.pytispark as pti
db = pymysql.connect(host='172.16.40.158', port=4000, user='st_user', passwd='aqpuBLYzEV7tML5RPsN1pntUzFy', db = pymysql.connect(host='172.16.40.158', port=4000, user='st_user', passwd='aqpuBLYzEV7tML5RPsN1pntUzFy',
db='jerry_prod') db='jerry_prod')
cursor = db.cursor() cursor = db.cursor()
def con_sql(sql): def con_sql(sql):
# 从数据库的表里获取数据 # 从数据库的表里获取数据
...@@ -78,17 +79,11 @@ spark.sql("CREATE TEMPORARY FUNCTION json_map AS 'brickhouse.udf.json.JsonMapUDF ...@@ -78,17 +79,11 @@ spark.sql("CREATE TEMPORARY FUNCTION json_map AS 'brickhouse.udf.json.JsonMapUDF
spark.sql("CREATE TEMPORARY FUNCTION is_json AS 'com.gmei.hive.common.udf.UDFJsonFormatCheck'") spark.sql("CREATE TEMPORARY FUNCTION is_json AS 'com.gmei.hive.common.udf.UDFJsonFormatCheck'")
spark.sql("CREATE TEMPORARY FUNCTION arrayMerge AS 'com.gmei.hive.common.udf.UDFArryMerge'") spark.sql("CREATE TEMPORARY FUNCTION arrayMerge AS 'com.gmei.hive.common.udf.UDFArryMerge'")
ungrey_select_sql = """SELECT *,NVL(ROUND(wel_click_pv/wel_exp_pv,6),0) as meigou_ctr, grey_select_sql = """SELECT *,NVL(ROUND((navbar_search+highlight_word+self_welfare_card+recommend_welfare_card+recommend_content_card*0.2+transfer_card+video_consultation)/card_exposure,5),0) as recommend_ctr,
NVL(ROUND(content_click_pv/content_exp_pv,6),0) as neirong_ctr FROM pm.tl_pm_contentpage_ctr where grey_type = '非灰'""" NVL(ROUND(card_click/card_exposure,5),0) as click_ctr,
ungrey_df = spark.sql(ungrey_select_sql) NVL(ROUND((navbar_search+highlight_word+self_welfare_card+recommend_welfare_card+recommend_content_card*0.2+transfer_card+video_consultation)/card_click,5),0) as second_jump_ctr, FROM pm.tl_pm_recommend_strategy_d"""
ungrey_df.createOrReplaceTempView("ungrey") device_df = spark.sql(grey_select_sql)
grey_select_sql = """SELECT *,NVL(ROUND(wel_click_pv/wel_exp_pv,6),0) as grey_meigou_ctr,
NVL(ROUND(content_click_pv/content_exp_pv,6),0) as grey_neirong_ctr FROM pm.tl_pm_contentpage_ctr where grey_type = '灰度'"""
grey_df = spark.sql(grey_select_sql)
grey_df.createOrReplaceTempView("grey")
sql = """SELECT *,ungrey.meigou_ctr,ungrey.neirong_ctr from grey"""
device_df.show(1, False) device_df.show(1, False)
sql_res = device_df.collect() sql_res = device_df.collect()
print("-----------------------------------------------------------------------------") print("-----------------------------------------------------------------------------")
...@@ -97,30 +92,39 @@ for res in sql_res: ...@@ -97,30 +92,39 @@ for res in sql_res:
day_id = res.day_id day_id = res.day_id
device_os_type = res.device_os_type device_os_type = res.device_os_type
active_type = res.active_type active_type = res.active_type
grey_type = res.grey_type card_content_type = res.card_content_type
page_name = res.page_name recommend_type = res.recommend_type
content_pv = res.content_pv card_click = res.card_click
content_uv = res.content_uv card_exposure = res.card_exposure
wel_exp_pv = res.wel_exp_pv avg_page_stay = res.avg_page_stay
content_exp_pv = res.content_exp_pv navbar_search = res.navbar_search
meigou_ctr=res.meigou_ctr highlight_word = res.highlight_word
neirong_ctr=res.neirong_ctr self_welfare_card = res.self_welfare_card
wel_click_pv = res.wel_click_pv recommend_welfare_card = res.recommend_welfare_card
content_click_pv = res.content_click_pv recommend_content_card = res.recommend_content_card
slide_wel_click_pv = res.slide_wel_click_pv recommend_special_card = res.recommend_special_card
self_wel_click_pv = res.self_wel_click_pv transfer_card = res.transfer_card
partition_day = res.PARTITION_DAY video_consultation = res.video_consultation
pid = hashlib.md5((day_id + device_os_type + active_type + grey_type + page_name).encode("utf8")).hexdigest() partition_day = res.partition_day
instert_sql = """replace into conent_detail_page_grayscale_ctr( recommend_ctr = res.recommend_ctr
day_id,device_os_type,active_type,grey_type,page_name,content_pv,content_uv,wel_exp_pv, second_jump_ctr = res.second_jump_ctr
content_exp_pv,wel_click_pv,content_click_pv,slide_wel_click_pv,self_wel_click_pv,partition_day,pid,meigou_ctr,neirong_ctr click_ctr = res.click_ctr
) VALUES('{day_id}','{device_os_type}','{active_type}','{grey_type}','{page_name}',{content_pv},{content_uv}, pid = hashlib.md5((day_id + device_os_type + active_type + card_content_type + recommend_type).encode("utf8")).hexdigest()
{wel_exp_pv},{content_exp_pv},{wel_click_pv},{content_click_pv},{slide_wel_click_pv},{self_wel_click_pv},'{partition_day}','{pid}',{meigou_ctr},{neirong_ctr});""".format( instert_sql = """replace into recommend_strategy_d(
day_id=day_id,device_os_type=device_os_type,active_type=active_type,grey_type=grey_type,page_name=page_name, day_id,device_os_type,active_type,card_content_type,recommend_type,card_click,card_exposure,avg_page_stay,navbar_search,
content_pv=content_pv,content_uv=content_uv,wel_exp_pv=wel_exp_pv,content_exp_pv=content_exp_pv,wel_click_pv=wel_click_pv, highlight_word,self_welfare_card,recommend_welfare_card,recommend_content_card,recommend_special_card,transfer_card,video_consultation,
content_click_pv=content_click_pv,slide_wel_click_pv=slide_wel_click_pv,self_wel_click_pv=self_wel_click_pv,meigou_ctr=meigou_ctr,neirong_ctr=neirong_ctr, partition_day,pid,recommend_ctr,second_jump_ctr,click_ctr
partition_day=partition_day, pid=pid ) VALUES('{day_id}','{device_os_type}','{active_type}','{card_content_type}','{recommend_type}',{card_click},{card_exposure},
{avg_page_stay},{navbar_search},{self_welfare_card},{recommend_welfare_card},{recommend_content_card},{recommend_special_card},
{transfer_card},{video_consultation},'{partition_day}','{pid}',{recommend_ctr},{second_jump_ctr},{click_ctr});""".format(
day_id=day_id, device_os_type=device_os_type, active_type=active_type, card_content_type=card_content_type,
card_click=card_click, recommend_type=recommend_type, card_exposure=card_exposure, avg_page_stay=avg_page_stay,
navbar_search=navbar_search, self_welfare_card=self_welfare_card, recommend_welfare_card=recommend_welfare_card,
recommend_content_card=recommend_content_card, recommend_special_card=recommend_special_card,
transfer_card=transfer_card,
video_consultation=video_consultation, partition_day=partition_day, pid=pid, recommend_ctr=recommend_ctr,
second_jump_ctr=second_jump_ctr, click_ctr=click_ctr
) )
print(instert_sql) print(instert_sql)
# cursor.execute("set names 'UTF8'") # cursor.execute("set names 'UTF8'")
...@@ -128,4 +132,4 @@ for res in sql_res: ...@@ -128,4 +132,4 @@ for res in sql_res:
db.commit() db.commit()
print(res) print(res)
# cursor.executemany() # cursor.executemany()
db.close() db.close()
\ No newline at end of file
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment