Skip to content

Commit f8bc7ae

Browse files
Add files via upload
1 parent a2a3135 commit f8bc7ae

File tree

3 files changed

+126
-0
lines changed

3 files changed

+126
-0
lines changed

src/qs/cair/scripts/multitask.sh

Lines changed: 42 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,42 @@
#!/usr/bin/env bash
#
# Launch main/multitask.py on the msmarco dataset.
#
# Usage: multitask.sh <gpu_ids> <model_name>
#   <gpu_ids>     exported to the Python process as CUDA_VISIBLE_DEVICES
#   <model_name>  passed as both --model_type and --model_name
#
# SRC_DIR is the relative path "../", so every path below resolves against the
# current working directory: ../main/, ../data/ and ../tmp/.

set -euo pipefail

# Fail early with a usage message instead of handing Python a flag that has
# no value. An empty-string <gpu_ids> is still accepted.
if (( $# < 2 )); then
  printf 'Usage: %s <gpu_ids> <model_name>\n' "${0##*/}" >&2
  exit 2
fi

SRC_DIR=../
# Trailing slashes are kept exactly as before.
# NOTE(review): the Python side may build file paths by string concatenation;
# confirm before normalising these.
DATA_DIR=${SRC_DIR}/data/
EMBED_DIR=${SRC_DIR}/data/fasttext/
MODEL_DIR=${SRC_DIR}/tmp/

RGPU=$1
MODEL_NAME=$2
DATASET=msmarco

# Every expansion is quoted so a value containing whitespace or glob
# characters reaches Python as one unmodified argument.
PYTHONPATH="$SRC_DIR" CUDA_VISIBLE_DEVICES="$RGPU" python -W ignore "${SRC_DIR}/main/multitask.py" \
  --model_type "$MODEL_NAME" \
  --train_file train.json \
  --dev_file dev.json \
  --test_file test.json \
  --max_doc_len 200 \
  --max_query_len 20 \
  --uncase True \
  --max_examples -1 \
  --emsize 300 \
  --batch_size 32 \
  --test_batch_size 32 \
  --num_epochs 50 \
  --dropout_emb 0.2 \
  --dropout 0.2 \
  --dropout_rnn 0.2 \
  --optimizer adam \
  --learning_rate 0.001 \
  --weight_decay 0.0 \
  --early_stop 5 \
  --valid_metric bleu \
  --checkpoint True \
  --model_dir "$MODEL_DIR" \
  --model_name "$MODEL_NAME" \
  --only_test False \
  --data_workers 5 \
  --dataset_name "$DATASET" \
  --data_dir "${DATA_DIR}/${DATASET}/" \
  --embed_dir "$EMBED_DIR" \
  --embedding_file crawl-300d-2M-subword.vec

src/qs/cair/scripts/ranker.sh

Lines changed: 43 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,43 @@
#!/usr/bin/env bash
#
# Launch main/ranker.py on the msmarco dataset.
#
# Usage: ranker.sh <gpu_ids> <model_name>
#   <gpu_ids>     exported to the Python process as CUDA_VISIBLE_DEVICES
#   <model_name>  passed as both --model_type and --model_name
#
# SRC_DIR is the relative path "../", so every path below resolves against the
# current working directory: ../main/, ../data/ and ../tmp/.

set -euo pipefail

# Fail early with a usage message instead of handing Python a flag that has
# no value. An empty-string <gpu_ids> is still accepted.
if (( $# < 2 )); then
  printf 'Usage: %s <gpu_ids> <model_name>\n' "${0##*/}" >&2
  exit 2
fi

SRC_DIR=../
# Trailing slashes are kept exactly as before.
# NOTE(review): the Python side may build file paths by string concatenation;
# confirm before normalising these.
DATA_DIR=${SRC_DIR}/data/
EMBED_DIR=${SRC_DIR}/data/fasttext/
MODEL_DIR=${SRC_DIR}/tmp/

RGPU=$1
MODEL_NAME=$2
DATASET=msmarco

# Every expansion is quoted so a value containing whitespace or glob
# characters reaches Python as one unmodified argument.
PYTHONPATH="$SRC_DIR" CUDA_VISIBLE_DEVICES="$RGPU" python -W ignore "${SRC_DIR}/main/ranker.py" \
  --model_type "$MODEL_NAME" \
  --train_file train.json \
  --dev_file dev.json \
  --test_file test.json \
  --max_doc_len 200 \
  --max_query_len 20 \
  --uncase True \
  --num_candidates 10 \
  --max_examples -1 \
  --emsize 300 \
  --batch_size 64 \
  --test_batch_size 64 \
  --num_epochs 50 \
  --dropout_emb 0.2 \
  --dropout 0.2 \
  --dropout_rnn 0.2 \
  --optimizer adam \
  --learning_rate 0.001 \
  --weight_decay 0.0 \
  --early_stop 5 \
  --valid_metric map \
  --checkpoint True \
  --model_dir "$MODEL_DIR" \
  --model_name "$MODEL_NAME" \
  --only_test False \
  --data_workers 5 \
  --dataset_name "$DATASET" \
  --data_dir "${DATA_DIR}/${DATASET}/" \
  --embed_dir "$EMBED_DIR" \
  --embedding_file crawl-300d-2M-subword.vec

src/qs/cair/scripts/recommender.sh

Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,41 @@
#!/usr/bin/env bash
#
# Launch main/recommender.py on the msmarco dataset.
#
# Usage: recommender.sh <gpu_ids> <model_name>
#   <gpu_ids>     exported to the Python process as CUDA_VISIBLE_DEVICES
#   <model_name>  passed as both --model_type and --model_name
#
# SRC_DIR is the relative path "../", so every path below resolves against the
# current working directory: ../main/, ../data/ and ../tmp/.

set -euo pipefail

# Fail early with a usage message instead of handing Python a flag that has
# no value. An empty-string <gpu_ids> is still accepted.
if (( $# < 2 )); then
  printf 'Usage: %s <gpu_ids> <model_name>\n' "${0##*/}" >&2
  exit 2
fi

SRC_DIR=../
# Trailing slashes are kept exactly as before.
# NOTE(review): the Python side may build file paths by string concatenation;
# confirm before normalising these.
DATA_DIR=${SRC_DIR}/data/
EMBED_DIR=${SRC_DIR}/data/fasttext/
MODEL_DIR=${SRC_DIR}/tmp/

RGPU=$1
MODEL_NAME=$2
DATASET=msmarco

# The interpreter was previously written as "python:wq" (a stray editor
# command), which made the script fail with "command not found".
# Every expansion is quoted so a value containing whitespace or glob
# characters reaches Python as one unmodified argument.
PYTHONPATH="$SRC_DIR" CUDA_VISIBLE_DEVICES="$RGPU" python -W ignore "${SRC_DIR}/main/recommender.py" \
  --model_type "$MODEL_NAME" \
  --train_file train.json \
  --dev_file dev.json \
  --test_file test.json \
  --max_query_len 20 \
  --uncase True \
  --num_candidates 10 \
  --max_examples -1 \
  --emsize 300 \
  --batch_size 64 \
  --test_batch_size 64 \
  --num_epochs 50 \
  --dropout_emb 0.2 \
  --dropout 0.2 \
  --dropout_rnn 0.2 \
  --optimizer adam \
  --learning_rate 0.001 \
  --weight_decay 0.0 \
  --early_stop 5 \
  --valid_metric bleu \
  --checkpoint True \
  --model_dir "$MODEL_DIR" \
  --model_name "$MODEL_NAME" \
  --only_test False \
  --data_workers 5 \
  --dataset_name "$DATASET" \
  --data_dir "${DATA_DIR}/${DATASET}/" \
  --embed_dir "$EMBED_DIR" \
  --embedding_file crawl-300d-2M-subword.vec

0 commit comments

Comments
 (0)