submit.sh 4.16 KB
Newer Older
高雅喆's avatar
高雅喆 committed
1
#! /bin/bash
高雅喆's avatar
高雅喆 committed
2 3 4
# Locations shared by every stage of this pipeline:
#   PYTHON_PATH - interpreter used to launch the Python stages
#   MODEL_PATH  - directory containing Feature_pipline/ and Model_pipline/
#   DATA_PATH   - working directory for csv, tfrecord, checkpoint and log files
PYTHON_PATH="/home/gaoyazhe/miniconda3/bin/python"
MODEL_PATH="/srv/apps/ffm-baseline/eda/esmm"
DATA_PATH="/home/gaoyazhe/data"
高雅喆's avatar
高雅喆 committed
5

高雅喆's avatar
高雅喆 committed
6
echo "start time"
# Read seconds and nanoseconds in a single date call so that timeStamp and
# currentTimeStamp describe the same instant.
clock_reading=$(date "+%s %N")
timeStamp=${clock_reading% *}
current=$(date -d "@${timeStamp}" "+%Y-%m-%d %H:%M:%S")
# %N is zero-padded (e.g. 081234567). Without the 10# prefix bash would parse
# the leading 0 as octal and fail on the digits 8 and 9.
currentTimeStamp=$((timeStamp * 1000 + 10#${clock_reading#* } / 1000000))
echo "$current"
高雅喆's avatar
高雅喆 committed
11 12

echo "rm leave tfrecord"
# Remove files left in the per-dataset directories by an earlier run.
# ${DATA_PATH:?} aborts the script instead of expanding to /tr/* and friends
# when DATA_PATH is unset or empty; -f keeps an already-empty directory from
# being reported as an error.
for leftover_dir in tr va native nearby; do
  rm -f -- "${DATA_PATH:?}/${leftover_dir}"/*
done
# Remove checkpoint entries whose names start with "201".
rm -rf -- "${DATA_PATH:?}"/model_ckpt/DeepCvrMTL/201*
高雅喆's avatar
高雅喆 committed
18

高雅喆's avatar
高雅喆 committed
19
echo "data2ffm"
# Run the data2ffm.py stage; its stdout replaces the contents of infer.log.
# All expansions are quoted so paths are passed as single words.
"${PYTHON_PATH}" "${MODEL_PATH}/Feature_pipline/data2ffm.py" > "${DATA_PATH}/infer.log"
高雅喆's avatar
高雅喆 committed
21

高雅喆's avatar
高雅喆 committed
22
#######################################
# Print the "Bayes Error Rate" diagnostic for a tab-separated sample file.
# Column 5 of each row is treated as a comma-separated list:
#   all_sample = number of distinct concatenations of its items 2, 3 and 4
#   uniq_feat  = number of item-4 values that occur exactly once
#   repe_feat  = all_sample - uniq_feat
# The rate printed is repe_feat * 100 / all_sample (integer division).
# Globals:   all_sample, uniq_feat, repe_feat (written, as in the inline form)
# Arguments: $1 - path to the sample file
# Outputs:   "Bayes Error Rate: N%" on stdout; diagnostics on stderr
# Returns:   0 on success, 1 if the file is unreadable or yields no samples
#######################################
bayes_error_rate() {
  local csv=$1

  if [[ ! -r "${csv}" ]]; then
    echo "Bayes Error Rate: cannot read ${csv}" >&2
    return 1
  fi

  all_sample=$(awk -F '\t' '{print $5}' "${csv}" \
    | awk -F ',' '{print $2$3$4}' \
    | sort -u \
    | wc -l)
  uniq_feat=$(awk -F '\t' '{print $5}' "${csv}" \
    | awk -F ',' '{print $4}' \
    | sort \
    | uniq -u \
    | wc -l)

  # An empty file would otherwise end in a division by zero.
  if ((all_sample == 0)); then
    echo "Bayes Error Rate: no samples in ${csv}" >&2
    return 1
  fi

  repe_feat=$((all_sample - uniq_feat))
  echo "Bayes Error Rate: $((repe_feat * 100 / all_sample))%"
}

# The metric is informational only, so a failure here must never stop the run.
bayes_error_rate "${DATA_PATH}/tr.csv" || true
高雅喆's avatar
高雅喆 committed
26

高雅喆's avatar
高雅喆 committed
27
#######################################
# Split a file into numbered chunks named <prefix>NNNN.csv.
# Each chunk holds floor(line_count / divisor) lines, but never fewer than
# one: a file shorter than the divisor would otherwise ask for "split -l 0",
# which split rejects.
# Arguments: $1 - source file
#            $2 - divisor applied to the source's line count
#            $3 - output path prefix
# Outputs:   diagnostics on stderr
# Returns:   non-zero if the source is unreadable or split fails
#######################################
split_csv() {
  local src=$1
  local divisor=$2
  local prefix=$3
  local total per_chunk

  if [[ ! -r "${src}" ]]; then
    echo "split data: cannot read ${src}" >&2
    return 1
  fi

  total=$(wc -l < "${src}")
  per_chunk=$((total / divisor))
  if ((per_chunk < 1)); then
    per_chunk=1
  fi

  split -l "${per_chunk}" -d -a 4 --additional-suffix=.csv -- "${src}" "${prefix}"
}

echo "split data"
split_csv "${DATA_PATH}/tr.csv" 15 "${DATA_PATH}/tr/tr_"
split_csv "${DATA_PATH}/va.csv" 5 "${DATA_PATH}/va/va_"
split_csv "${DATA_PATH}/native.csv" 15 "${DATA_PATH}/native/native_"
split_csv "${DATA_PATH}/nearby.csv" 5 "${DATA_PATH}/nearby/nearby_"
高雅喆's avatar
高雅喆 committed
32 33

echo "csv to tfrecord"
# Run get_tfrecord.py once per dataset directory, in the original order.
# Each run reads from and writes to the same directory. Expansions are quoted
# so each path reaches the script as a single argument.
for dataset in tr va native nearby; do
  "${PYTHON_PATH}" "${MODEL_PATH}/Feature_pipline/get_tfrecord.py" \
    --input_dir="${DATA_PATH}/${dataset}/" \
    --output_dir="${DATA_PATH}/${dataset}/"
done
高雅喆's avatar
高雅喆 committed
38

高雅喆's avatar
高雅喆 committed
39 40 41 42
# Concatenate every *.tfrecord file of a dataset directory into a single
# <dataset>.tfrecord inside that same directory.
# NOTE(review): the merged file's own name matches the *.tfrecord glob, so this
# relies on it not existing beforehand (the script empties these directories
# in its cleanup step) - confirm before running this step in isolation.
for dataset in tr va native nearby; do
  cat "${DATA_PATH}/${dataset}"/*.tfrecord > "${DATA_PATH}/${dataset}/${dataset}.tfrecord"
done
高雅喆's avatar
高雅喆 committed
43

高雅喆's avatar
高雅喆 committed
44 45 46 47
# Delete the per-chunk files (names starting with "<dataset>_") from each
# dataset directory; the merged <dataset>.tfrecord has no underscore and is kept.
# ${DATA_PATH:?} aborts instead of targeting /tr/tr_* and friends when
# DATA_PATH is unset or empty.
for dataset in tr va native nearby; do
  rm -- "${DATA_PATH:?}/${dataset}/${dataset}"_*
done
高雅喆's avatar
高雅喆 committed
48

高雅喆's avatar
高雅喆 committed
49
echo "data transform time"
# Read seconds and nanoseconds in a single date call so that timeStamp and
# currentTimeStamp describe the same instant.
clock_reading=$(date "+%s %N")
timeStamp=${clock_reading% *}
current=$(date -d "@${timeStamp}" "+%Y-%m-%d %H:%M:%S")
# %N is zero-padded (e.g. 081234567). Without the 10# prefix bash would parse
# the leading 0 as octal and fail on the digits 8 and 9.
currentTimeStamp=$((timeStamp * 1000 + 10#${clock_reading#* } / 1000000))
echo "$current"
高雅喆's avatar
高雅喆 committed
54

高雅喆's avatar
高雅喆 committed
55
echo "train..."
# Arguments for the DeepCvrMTL.py training run, one per line for readability.
# Values are unchanged; path expansions are quoted so each stays one word.
train_args=(
  --ctr_task_wgt=0.3
  --learning_rate=0.0001
  --deep_layers=256,128
  --dropout=0.8,0.5
  --optimizer=Adam
  --num_epochs=1
  --embedding_size=16
  --batch_size=1024
  --field_size=8
  --feature_size=2000
  --l2_reg=0.005
  --log_steps=100
  --num_threads=36
  --model_dir="${DATA_PATH}/model_ckpt/DeepCvrMTL/"
  --data_dir="${DATA_PATH}"
  --task_type=train
)
"${PYTHON_PATH}" "${MODEL_PATH}/Model_pipline/DeepCvrMTL.py" "${train_args[@]}"
高雅喆's avatar
高雅喆 committed
57

高雅喆's avatar
高雅喆 committed
58
echo "train time"
# Read seconds and nanoseconds in a single date call so that timeStamp and
# currentTimeStamp describe the same instant.
clock_reading=$(date "+%s %N")
timeStamp=${clock_reading% *}
current=$(date -d "@${timeStamp}" "+%Y-%m-%d %H:%M:%S")
# %N is zero-padded (e.g. 081234567). Without the 10# prefix bash would parse
# the leading 0 as octal and fail on the digits 8 and 9.
currentTimeStamp=$((timeStamp * 1000 + 10#${clock_reading#* } / 1000000))
echo "$current"
高雅喆's avatar
高雅喆 committed
63 64

echo "infer native..."
# Arguments for the DeepCvrMTL.py inference run over the "native" data
# directory. Values are unchanged; path expansions are quoted.
infer_native_args=(
  --ctr_task_wgt=0.3
  --learning_rate=0.0001
  --deep_layers=256,128
  --dropout=0.8,0.5
  --optimizer=Adam
  --num_epochs=1
  --embedding_size=16
  --batch_size=1024
  --field_size=8
  --feature_size=2000
  --l2_reg=0.005
  --log_steps=100
  --num_threads=36
  --model_dir="${DATA_PATH}/model_ckpt/DeepCvrMTL/"
  --data_dir="${DATA_PATH}/native"
  --task_type=infer
)
# NOTE(review): ">" truncates infer.log, which the data2ffm and nearby-inference
# steps of this script also redirect into, so only the last writer's output
# survives - confirm that is intended.
"${PYTHON_PATH}" "${MODEL_PATH}/Model_pipline/DeepCvrMTL.py" "${infer_native_args[@]}" \
  > "${DATA_PATH}/infer.log"
高雅喆's avatar
高雅喆 committed
66 67 68


echo "infer nearby..."
# Arguments for the DeepCvrMTL.py inference run over the "nearby" data
# directory. Values are unchanged; path expansions are quoted.
infer_nearby_args=(
  --ctr_task_wgt=0.3
  --learning_rate=0.0001
  --deep_layers=256,128
  --dropout=0.8,0.5
  --optimizer=Adam
  --num_epochs=1
  --embedding_size=16
  --batch_size=1024
  --field_size=8
  --feature_size=2000
  --l2_reg=0.005
  --log_steps=100
  --num_threads=36
  --model_dir="${DATA_PATH}/model_ckpt/DeepCvrMTL/"
  --data_dir="${DATA_PATH}/nearby"
  --task_type=infer
)
# NOTE(review): ">" truncates infer.log, discarding whatever the data2ffm and
# native-inference steps of this script wrote there - confirm that is intended.
"${PYTHON_PATH}" "${MODEL_PATH}/Model_pipline/DeepCvrMTL.py" "${infer_nearby_args[@]}" \
  > "${DATA_PATH}/infer.log"
高雅喆's avatar
高雅喆 committed
70 71

echo "sort and 2sql"
# Run the sort_and_2sql.py stage; it takes no arguments here. Expansions are
# quoted so the interpreter and script paths are each passed as one word.
"${PYTHON_PATH}" "${MODEL_PATH}/Model_pipline/sort_and_2sql.py"
高雅喆's avatar
高雅喆 committed
73

高雅喆's avatar
高雅喆 committed
74
echo "infer and sort and 2sql time"
# Read seconds and nanoseconds in a single date call so that timeStamp and
# currentTimeStamp describe the same instant.
clock_reading=$(date "+%s %N")
timeStamp=${clock_reading% *}
current=$(date -d "@${timeStamp}" "+%Y-%m-%d %H:%M:%S")
# %N is zero-padded (e.g. 081234567). Without the 10# prefix bash would parse
# the leading 0 as octal and fail on the digits 8 and 9.
currentTimeStamp=$((timeStamp * 1000 + 10#${clock_reading#* } / 1000000))
echo "$current"
高雅喆's avatar
高雅喆 committed
79 80

# Final step: run send_mail.py. Expansions are quoted so the interpreter and
# script paths are each passed as one word.
"${PYTHON_PATH}" "${MODEL_PATH}/Model_pipline/send_mail.py"