# start_task.py 2.56 KB
# -*- coding:UTF-8 -*-
# @Time  : 2020/8/20 17:20
# @File  : start_task.py
# @email : litao@igengmei.com
# @author : litao

import subprocess
import datetime
# from pyhive import hive

# Shared spark-submit invocation (binary, YARN options, resources, Spark
# confs and jars). Both task commands below are this prefix followed by the
# task's script path and a trailing newline.
_SPARK_SUBMIT_PREFIX = (
    '/opt/spark/bin/spark-submit'
    ' --master yarn'
    ' --deploy-mode client'
    ' --queue root.strategy'
    ' --driver-memory 16g'
    ' --executor-memory 1g'
    ' --executor-cores 1'
    ' --num-executors 70'
    ' --conf spark.default.parallelism=100'
    ' --conf spark.storage.memoryFraction=0.5'
    ' --conf spark.shuffle.memoryFraction=0.3'
    ' --conf spark.executorEnv.LD_LIBRARY_PATH="/opt/java/jdk1.8.0_181/jre/lib/amd64/server:/opt/cloudera/parcels/CDH-5.16.1-1.cdh5.16.1.p0.3/lib64"'
    ' --conf spark.locality.wait=0'
    ' --jars /srv/apps/tispark-core-2.1-SNAPSHOT-jar-with-dependencies.jar,/srv/apps/spark-connector_2.11-1.9.0-rc2.jar,/srv/apps/mysql-connector-java-5.1.38.jar'
    ' '
)

# Full shell command lines, one per Spark task script.
conent_detail_page_grayscale_ctr_str = (
    _SPARK_SUBMIT_PREFIX
    + '/srv/apps/meta_base_code/task/conent_detail_page_grayscale_ctr.py\n'
)
recommend_strategy_d_str = (
    _SPARK_SUBMIT_PREFIX
    + '/srv/apps/meta_base_code/task/recommend_strategy_d.py\n'
)


# Hive connection settings. In the code shown here they are only referenced
# by the commented-out `hive.Connection(...)` call below.
hive_host = "bj-gm-prod-cos-datacenter003"
hive_port = 10000
hive_username = "strategy"
hive_database = "online"

# Disabled: opening the connection needs the `pyhive` import, which is also
# commented out at the top of the file.
# conn = hive.Connection(host=hive_host, port=hive_port, username=hive_username, database=hive_database)
# cursor = conn.cursor()

# Table name; its only visible use is the commented-out `if_write_data(table_1)`
# call in the `__main__` block.
table_1 = "pm.tl_pm_recommend_strategy_d"


# def if_write_data(table):
#     now = datetime.datetime.now() - datetime.timedelta(days=1)
#     date_str = now.strftime("%Y%m%d")
#     sql_str = "select count(*) from {0} where day_id = {1}".format(table,date_str)
#     res = cursor.fetchall(sql_str)
#     print(res)
#     if res:
#         return True
#     else:
#         return False



def func_cal_task(task_str):
    """Run a shell command line after activating the ``esmm`` virtualenv.

    The activation line and ``task_str`` are joined into one script and
    executed by bash. The two commands are newline-separated, so the task
    line is still attempted if the activation line fails.

    Args:
        task_str: Shell command text to run after the activation line.

    Returns:
        int: Exit status of the shell that ran the script (0 on success).
    """
    activate_cmd = "source /srv/envs/esmm/bin/activate\n"
    print(activate_cmd)
    script = activate_cmd + task_str
    # `source` is a bash builtin. With shell=True the default interpreter is
    # /bin/sh, which on some systems is dash and does not provide `source`,
    # so run the script under bash explicitly.
    completed = subprocess.run(script, shell=True, executable="/bin/bash")
    if completed.returncode != 0:
        # Surface failures instead of silently discarding the exit status.
        print("task exited with status {0}: {1}".format(
            completed.returncode, task_str.strip()))
    return completed.returncode



if __name__ == "__main__":
    # The Hive-based check (`if_write_data`) and the cursor/connection
    # cleanup that went with it are disabled; only the Spark tasks run.
    # Each call blocks until its command finishes, so the tasks execute
    # one after another in the order listed.
    for task_cmd in (recommend_strategy_d_str, conent_detail_page_grayscale_ctr_str):
        func_cal_task(task_cmd)