submit.sh 4.22 KB
Newer Older
高雅喆's avatar
高雅喆 committed
1
#! /bin/bash
高雅喆's avatar
高雅喆 committed
2 3 4

# Run from the ESMM checkout with its master branch active. Abort when the
# directory is missing so that `git checkout` never runs against whatever
# repository the caller's working directory happens to be in.
cd /srv/apps/ffm-baseline/eda/esmm || exit 1
git checkout master
高雅喆's avatar
高雅喆 committed
5 6
# Python interpreter and code checkout used by the pipeline commands below.
PYTHON_PATH='/home/gaoyazhe/miniconda3/bin/python'
MODEL_PATH='/srv/apps/ffm-baseline/eda/esmm'
7
# Root directory for the CSV inputs, working sub-directories, logs and checkpoints.
DATA_PATH='/home/gmuser/esmm_data'
高雅喆's avatar
高雅喆 committed
8

高雅喆's avatar
高雅喆 committed
9
# Progress banner: label for the timestamp printed next.
printf '%s\n' 'start time'
高雅喆's avatar
高雅喆 committed
10 11 12
# Capture the current wall-clock time as a readable string, the matching epoch
# seconds, and an epoch-milliseconds value.
current=$(date "+%Y-%m-%d %H:%M:%S")
timeStamp=$(date -d "$current" +%s)
# %N is zero-padded to nine digits; the 10# prefix forces base 10 so a value
# such as 012345678 or 089000000 is not parsed as (possibly invalid) octal.
currentTimeStamp=$((timeStamp * 1000 + 10#$(date "+%N") / 1000000))
高雅喆's avatar
高雅喆 committed
13
# Print the timestamp string held in $current.
printf '%s\n' "$current"
高雅喆's avatar
高雅喆 committed
14 15

# Progress banner for the cleanup step.
printf '%s\n' 'rm leave tfrecord'
高雅喆's avatar
高雅喆 committed
16 17 18 19
# Remove the files left in the four working directories by a previous run
# (no -r, so sub-directories are not removed).
# ${DATA_PATH:?} aborts the script when DATA_PATH is unset or empty, so the
# globs can never expand against the filesystem root; -f keeps an already
# empty directory from being reported as an error.
rm -f -- "${DATA_PATH:?}"/tr/*
rm -f -- "${DATA_PATH:?}"/va/*
rm -f -- "${DATA_PATH:?}"/native/*
rm -f -- "${DATA_PATH:?}"/nearby/*
高雅喆's avatar
高雅喆 committed
20
# Recursively delete entries under model_ckpt/DeepCvrMTL whose names start
# with "201". ${DATA_PATH:?} aborts instead of deleting relative to "/" when
# DATA_PATH is unset or empty.
# NOTE(review): if these entries are named by date, anything from 2020 onward
# does not match 201* and is never cleaned up — confirm the intended pattern.
rm -rf -- "${DATA_PATH:?}"/model_ckpt/DeepCvrMTL/201*
高雅喆's avatar
高雅喆 committed
21

高雅喆's avatar
高雅喆 committed
22
# Progress banner for the data2ffm step.
printf '%s\n' 'data2ffm'
高雅喆's avatar
高雅喆 committed
23
# Run Feature_pipline/data2ffm.py, sending its stdout to infer.log (the file is
# truncated first). Expansions are quoted so the paths stay single words.
# NOTE(review): both inference steps later redirect to the same infer.log with
# ">", so this output does not survive the run — confirm that is intended.
"${PYTHON_PATH}" "${MODEL_PATH}/Feature_pipline/data2ffm.py" \
  > "${DATA_PATH}/infer.log"
高雅喆's avatar
高雅喆 committed
24

高雅喆's avatar
高雅喆 committed
25
#######################################
# Print the "Bayes Error Rate" diagnostic for a training CSV.
# The figure is (A - U) * 100 / A using integer arithmetic, where
#   A = number of distinct concatenations of sub-fields 2, 3 and 4 of the
#       comma-separated 5th tab-separated column, and
#   U = number of sub-field-4 values that occur exactly once.
# Globals:   all_sample, uniq_feat, repe_feat (written)
# Arguments: $1 - path of the CSV to analyse
# Outputs:   one "Bayes Error Rate: ..." line on stdout
# Returns:   0; the report is informational only
#######################################
report_bayes_error_rate() {
  local csv=$1

  all_sample=$(($(awk -F '\t' '{print $5}' "${csv}" \
    | awk -F ',' '{print $2$3$4}' | sort -u | wc -l)))
  uniq_feat=$(($(awk -F '\t' '{print $5}' "${csv}" \
    | awk -F ',' '{print $4}' | sort | uniq -u | wc -l)))
  repe_feat=$((all_sample - uniq_feat))

  # An empty or unreadable file yields zero samples; report that instead of
  # letting the percentage below fail with "division by 0".
  if ((all_sample == 0)); then
    echo "Bayes Error Rate": "N/A (no samples)"
    return 0
  fi
  echo "Bayes Error Rate": $((repe_feat * 100 / all_sample))%
}

report_bayes_error_rate "${DATA_PATH}/tr.csv"
高雅喆's avatar
高雅喆 committed
29

高雅喆's avatar
高雅喆 committed
30
# Progress banner for the split step.
printf '%s\n' 'split data'
高雅喆's avatar
高雅喆 committed
31 32
#######################################
# Split a file into numbered .csv chunks of (line count / PARTS) lines each.
# The chunk size is floored, so a remainder produces one extra chunk, and it
# is clamped to at least 1 so files shorter than PARTS lines no longer make
# `split -l 0` fail.
# Arguments: $1 - file to split
#            $2 - divisor applied to the line count
#            $3 - output prefix; chunks are <prefix>NNNN.csv (4-digit suffix)
# Outputs:   an error message on stderr when the file cannot be read
# Returns:   1 if the file is unreadable, otherwise split's exit status
#######################################
split_into_parts() {
  local src=$1
  local parts=$2
  local prefix=$3
  local total per_chunk

  if [[ ! -r "${src}" ]]; then
    printf 'split data: cannot read %s\n' "${src}" >&2
    return 1
  fi

  total=$(wc -l < "${src}")
  per_chunk=$((total / parts))
  if ((per_chunk < 1)); then
    per_chunk=1
  fi

  split -l "${per_chunk}" -d -a 4 --additional-suffix=.csv "${src}" "${prefix}"
}

split_into_parts "${DATA_PATH}/tr.csv" 15 "${DATA_PATH}/tr/tr_"
split_into_parts "${DATA_PATH}/va.csv" 5 "${DATA_PATH}/va/va_"
split_into_parts "${DATA_PATH}/native.csv" 15 "${DATA_PATH}/native/native_"
split_into_parts "${DATA_PATH}/nearby.csv" 5 "${DATA_PATH}/nearby/nearby_"
高雅喆's avatar
高雅喆 committed
35 36

# Progress banner for the CSV-to-tfrecord conversion step.
printf '%s\n' 'csv to tfrecord'
高雅喆's avatar
高雅喆 committed
37 38 39 40
# Run Feature_pipline/get_tfrecord.py once per working directory, in the order
# tr, va, native, nearby, using the same directory as input and output.
# Expansions are quoted so each path is passed as a single word.
for subset in tr va native nearby; do
  "${PYTHON_PATH}" "${MODEL_PATH}/Feature_pipline/get_tfrecord.py" \
    --input_dir="${DATA_PATH}/${subset}/" \
    --output_dir="${DATA_PATH}/${subset}/"
done
高雅喆's avatar
高雅喆 committed
41

高雅喆's avatar
高雅喆 committed
42 43 44 45
# Concatenate every *.tfrecord file in each working directory into a single
# <dir>/<dir>.tfrecord file. The glob stays outside the quotes so it expands.
# NOTE(review): the output name also matches *.tfrecord, so a merged file left
# over from an earlier run would be picked up as an input — this relies on the
# directory having been emptied at the start of the script.
for subset in tr va native nearby; do
  cat "${DATA_PATH}/${subset}"/*.tfrecord \
    > "${DATA_PATH}/${subset}/${subset}.tfrecord"
done
高雅喆's avatar
高雅喆 committed
46

高雅喆's avatar
高雅喆 committed
47 48 49 50
# Delete the files named <dir>_* in each working directory; the merged
# <dir>.tfrecord files do not match that pattern and are kept.
# ${DATA_PATH:?} aborts the script when DATA_PATH is unset or empty so the
# globs never expand relative to "/"; -f avoids an error when nothing matches.
rm -f -- "${DATA_PATH:?}"/tr/tr_*
rm -f -- "${DATA_PATH:?}"/va/va_*
rm -f -- "${DATA_PATH:?}"/native/native_*
rm -f -- "${DATA_PATH:?}"/nearby/nearby_*
高雅喆's avatar
高雅喆 committed
51

高雅喆's avatar
高雅喆 committed
52
# Progress banner: label for the timestamp printed next.
printf '%s\n' 'data transform time'
高雅喆's avatar
高雅喆 committed
53 54 55
# Capture the current wall-clock time as a readable string, the matching epoch
# seconds, and an epoch-milliseconds value.
current=$(date "+%Y-%m-%d %H:%M:%S")
timeStamp=$(date -d "$current" +%s)
# %N is zero-padded to nine digits; the 10# prefix forces base 10 so a value
# such as 012345678 or 089000000 is not parsed as (possibly invalid) octal.
currentTimeStamp=$((timeStamp * 1000 + 10#$(date "+%N") / 1000000))
高雅喆's avatar
高雅喆 committed
56
# Print the timestamp string held in $current.
printf '%s\n' "$current"
高雅喆's avatar
高雅喆 committed
57

高雅喆's avatar
高雅喆 committed
58
# Progress banner for the training step.
printf '%s\n' 'train...'
高雅喆's avatar
高雅喆 committed
59
# Run Model_pipline/DeepCvrMTL.py with --task_type=train, reading from
# DATA_PATH and using model_ckpt/DeepCvrMTL/ as the model directory.
# The flags are held in an array (one per line) and every expansion is quoted,
# so each argument reaches the script as exactly one word.
train_args=(
  --ctr_task_wgt=0.3
  --learning_rate=0.0001
  --deep_layers=256,128
  --dropout=0.8,0.5
  --optimizer=Adam
  --num_epochs=1
  --embedding_size=16
  --batch_size=1024
  --field_size=8
  --feature_size=2000
  --l2_reg=0.005
  --log_steps=100
  --num_threads=36
  --model_dir="${DATA_PATH}/model_ckpt/DeepCvrMTL/"
  --data_dir="${DATA_PATH}"
  --task_type=train
)
"${PYTHON_PATH}" "${MODEL_PATH}/Model_pipline/DeepCvrMTL.py" "${train_args[@]}"
高雅喆's avatar
高雅喆 committed
60

高雅喆's avatar
高雅喆 committed
61
# Progress banner: label for the timestamp printed next.
printf '%s\n' 'train time'
高雅喆's avatar
高雅喆 committed
62 63 64
# Capture the current wall-clock time as a readable string, the matching epoch
# seconds, and an epoch-milliseconds value.
current=$(date "+%Y-%m-%d %H:%M:%S")
timeStamp=$(date -d "$current" +%s)
# %N is zero-padded to nine digits; the 10# prefix forces base 10 so a value
# such as 012345678 or 089000000 is not parsed as (possibly invalid) octal.
currentTimeStamp=$((timeStamp * 1000 + 10#$(date "+%N") / 1000000))
高雅喆's avatar
高雅喆 committed
65
# Print the timestamp string held in $current.
printf '%s\n' "$current"
高雅喆's avatar
高雅喆 committed
66 67

# Progress banner for the native inference step.
printf '%s\n' 'infer native...'
高雅喆's avatar
高雅喆 committed
68
# Run Model_pipline/DeepCvrMTL.py with --task_type=infer on the native data
# directory, sending stdout to infer.log (truncated first).
# The flags are held in an array (one per line) and every expansion is quoted,
# so each argument reaches the script as exactly one word.
# NOTE(review): the nearby inference step redirects to the same infer.log with
# ">", so this step's output is overwritten — confirm that is intended.
infer_native_args=(
  --ctr_task_wgt=0.3
  --learning_rate=0.0001
  --deep_layers=256,128
  --dropout=0.8,0.5
  --optimizer=Adam
  --num_epochs=1
  --embedding_size=16
  --batch_size=1024
  --field_size=8
  --feature_size=2000
  --l2_reg=0.005
  --log_steps=100
  --num_threads=36
  --model_dir="${DATA_PATH}/model_ckpt/DeepCvrMTL/"
  --data_dir="${DATA_PATH}/native"
  --task_type=infer
)
"${PYTHON_PATH}" "${MODEL_PATH}/Model_pipline/DeepCvrMTL.py" \
  "${infer_native_args[@]}" > "${DATA_PATH}/infer.log"
高雅喆's avatar
高雅喆 committed
69 70 71


# Progress banner for the nearby inference step.
printf '%s\n' 'infer nearby...'
高雅喆's avatar
高雅喆 committed
72
# Run Model_pipline/DeepCvrMTL.py with --task_type=infer on the nearby data
# directory, sending stdout to infer.log (truncated first).
# The flags are held in an array (one per line) and every expansion is quoted,
# so each argument reaches the script as exactly one word.
# NOTE(review): ">" replaces whatever the earlier steps wrote to infer.log;
# use ">>" here if the log is meant to keep all stages — confirm.
infer_nearby_args=(
  --ctr_task_wgt=0.3
  --learning_rate=0.0001
  --deep_layers=256,128
  --dropout=0.8,0.5
  --optimizer=Adam
  --num_epochs=1
  --embedding_size=16
  --batch_size=1024
  --field_size=8
  --feature_size=2000
  --l2_reg=0.005
  --log_steps=100
  --num_threads=36
  --model_dir="${DATA_PATH}/model_ckpt/DeepCvrMTL/"
  --data_dir="${DATA_PATH}/nearby"
  --task_type=infer
)
"${PYTHON_PATH}" "${MODEL_PATH}/Model_pipline/DeepCvrMTL.py" \
  "${infer_nearby_args[@]}" > "${DATA_PATH}/infer.log"
高雅喆's avatar
高雅喆 committed
73 74

# Progress banner for the sort_and_2sql step.
printf '%s\n' 'sort and 2sql'
高雅喆's avatar
高雅喆 committed
75
# Run Model_pipline/sort_and_2sql.py with no arguments. Expansions are quoted
# so the interpreter and script paths are each passed as a single word.
"${PYTHON_PATH}" "${MODEL_PATH}/Model_pipline/sort_and_2sql.py"
高雅喆's avatar
高雅喆 committed
76

高雅喆's avatar
高雅喆 committed
77
# Progress banner: label for the timestamp printed next.
printf '%s\n' 'infer and sort and 2sql time'
高雅喆's avatar
高雅喆 committed
78 79 80
# Capture the current wall-clock time as a readable string, the matching epoch
# seconds, and an epoch-milliseconds value.
current=$(date "+%Y-%m-%d %H:%M:%S")
timeStamp=$(date -d "$current" +%s)
# %N is zero-padded to nine digits; the 10# prefix forces base 10 so a value
# such as 012345678 or 089000000 is not parsed as (possibly invalid) octal.
currentTimeStamp=$((timeStamp * 1000 + 10#$(date "+%N") / 1000000))
高雅喆's avatar
高雅喆 committed
81
# Print the timestamp string held in $current.
printf '%s\n' "$current"
高雅喆's avatar
高雅喆 committed
82 83

# Run Model_pipline/send_mail.py with no arguments as the final step.
# Expansions are quoted so the interpreter and script paths are each passed as
# a single word.
"${PYTHON_PATH}" "${MODEL_PATH}/Model_pipline/send_mail.py"