forked from menggehe/DRAW
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathpreprocess_AGENDA.sh
26 lines (21 loc) · 1.05 KB
/
preprocess_AGENDA.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
#!/bin/bash
if [ "$#" -lt 1 ]; then
echo "./preprocess_AGENDA.sh <dataset_folder>"
exit 2
fi
processed_data_folder='graph2text/data/agenda'
mkdir -p ${processed_data_folder}
python preprocess/generate_input_agenda.py ${1} ${processed_data_folder}
python graph2text/preprocess.py -train_src ${processed_data_folder}/training-nodes.txt \
-train_graph ${processed_data_folder}/training-graph.txt \
-train_tgt ${processed_data_folder}/training-surface.txt \
-valid_src ${processed_data_folder}/dev-nodes.txt \
-valid_graph ${processed_data_folder}/dev-graph.txt \
-valid_tgt ${processed_data_folder}/dev-surface.txt \
-save_data ${processed_data_folder}/agenda \
-src_vocab_size 30000 \
-tgt_vocab_size 30000 \
-src_seq_length 10000 \
-tgt_seq_length 10000 \
-dynamic_dict \
-share_vocab