-
Notifications
You must be signed in to change notification settings - Fork 23
/
datarelease.mk
34 lines (32 loc) · 1.58 KB
/
datarelease.mk
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
# webq_<stem>: run scripts/data-release.py once per split (dev, train, test).
# Each run reads data/webquestions/<stem>/webquestions.<split>.json on stdin and
# writes its stdout to webquestions-translations/<stem>.<split>.json.
# <stem> is whatever `%` matched ($*) -- presumably a language code; confirm.
webq_%:
	mkdir -p webquestions-translations
	set -e; \
	for split in dev train test; do \
	  python scripts/data-release.py \
	    < data/webquestions/$*/webquestions.$$split.json \
	    > webquestions-translations/$*.$$split.json; \
	done
# sentences_webq_<stem>: for each split (train, dev, test) run
# scripts/data-release-senteces.py on
# data/webquestions/<stem>/webquestions.<split>.json, sort its output
# numerically, keep only the second tab-separated field, and write the result to
# working/webquestions-translations/<stem>.<split>.txt.
# Presumably the script emits "<number><TAB><sentence>" lines -- confirm against
# the script.  <stem> is whatever `%` matched ($*).
#
# The script is run into a scratch file as a plain command (not as the head of
# a pipeline) so that, with `set -e`, a failure in it aborts the recipe.  Under
# make's default /bin/sh a pipeline only reports the status of its last command,
# so `python ... | sort | cut` would hide a crash and leave a truncated output.
# On failure the scratch file <output>.raw is left behind for inspection.
#
# NOTE(review): the script name is spelled "senteces" here; it is kept as-is on
# the assumption that it matches the file on disk.
sentences_webq_%:
	mkdir -p working/webquestions-translations
	set -e; \
	for split in train dev test; do \
	  out=working/webquestions-translations/$*.$$split.txt; \
	  python scripts/data-release-senteces.py \
	    < data/webquestions/$*/webquestions.$$split.json \
	    > $$out.raw; \
	  sort -n $$out.raw | cut -f2 > $$out; \
	  rm -f $$out.raw; \
	done
# sentence_ids: run scripts/data-release-sentece-ids.py once per split, passing
# an original WebQuestions examples file and the matching
# working/webquestions-translations/en.<split>.txt, and capture stdout in
# working/webquestions-translations/en.<split>.ids.txt.
#
# The en.<split>.txt inputs are the files the sentences_webq_% rule writes for
# the stem `en`; that dependency is not declared, so run `make sentences_webq_en`
# first.
#
# NOTE(review): the dev split is matched against the *train* examples file --
# presumably because dev was carved out of the original train set; confirm.
# NOTE(review): this rule reads data/WebQuestions/... (capitalised) while the
# other rules in this file read data/webquestions/...; verify on a
# case-sensitive filesystem.
#
# Declared phony because the target names an action, not a file: without this,
# a file or directory called `sentence_ids` would make the rule a silent no-op.
.PHONY: sentence_ids
sentence_ids:
	python scripts/data-release-sentece-ids.py \
	  data/WebQuestions/original/webquestions.examples.train.json \
	  working/webquestions-translations/en.train.txt \
	  > working/webquestions-translations/en.train.ids.txt
	python scripts/data-release-sentece-ids.py \
	  data/WebQuestions/original/webquestions.examples.test.json \
	  working/webquestions-translations/en.test.txt \
	  > working/webquestions-translations/en.test.ids.txt
	python scripts/data-release-sentece-ids.py \
	  data/WebQuestions/original/webquestions.examples.train.json \
	  working/webquestions-translations/en.dev.txt \
	  > working/webquestions-translations/en.dev.ids.txt