-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathpredict.sh
executable file
·132 lines (114 loc) · 3.67 KB
/
predict.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
#!/bin/bash
# predict.sh -- batch driver around induce-dimlex.py.
#
# Production mode: DICTS names the ACoLi dictionary checkout, available from
# https://github.com/acoli-repo/acoli-dicts
# NOTE: a later DICTS assignment in this script replaces this value before any
# uncommented command reads it.
DICTS='../../../acoli-dicts/trunk/stable/'
# reduce min_pivot from optimum to lower values
# if min_pivot==1, generate both with and without English
# run for levels 0, 1 and 2/3 separately, then merge
# after generation
# no English, incl. DiscMar, all dicts
# for tgt in de cs fr pt it nl ca es; do
# dimlex=`ls ../tsv/*tsv | grep -v 'ted' | grep -v arabic | grep -v bangla | grep -v discmar.en | grep -v pdtb`;
# for DICT in $DICTS; do
# echo $tgt $DICT, no English, PDTB0 1 sense
# dicts=`find $DICT | egrep tsv.gz`
# python3 induce-dimlex.py \
# --dimlex $dimlex \
# --dict $dicts \
# --tgt $tgt \
# --th_steps 20 \
# --max_senses 1\
# --test_pivlangs 7 \
# --silent | \
# perl -pe 's/\./,/g; s/ +/\t/g;'
# echo
# done
# done
# # for tgt in de cs fr pt it nl ca es; do
# dimlex=`ls ../tsv/*tsv | grep -v 'ted' | grep -v arabic | grep -v bangla | grep -v discmar.en | grep -v pdtb`;
# for DICT in $DICTS; do
# echo $tgt $DICT, no English, PDTB1 2 senses
# dicts=`find $DICT | egrep tsv.gz`
# #--tgt de cs fr pt it nl ca es
# python3 induce-dimlex.py \
# --dimlex $dimlex \
# --dict $dicts \
# --tgt ca es \
# --th_steps 20 \
# --max_senses 2\
# --test_pivlangs 7 \
# --silent | \
# perl -pe 's/\./,/g; s/ +/\t/g;'
# echo
# done
# # done
DICTS=pruned-dicts/

#######################################
# Run induce-dimlex.py without English: lexicons whose path contains
# ted, arabic, bangla, discmar or pdtb are left out, max. 4 senses,
# 5 test pivot languages.
# The former per-target loop (for tgt in de cs fr pt it nl) is disabled;
# all targets are handed to a single induce-dimlex.py call instead.
# Globals:
#   DICTS (read)    whitespace-separated list of dictionary directories
#   DICT  (written) directory currently being processed
# Arguments:
#   None
# Outputs:
#   Per directory: one header line, the induce-dimlex.py output with every
#   '.' replaced by ',' and every run of spaces replaced by a tab, then a
#   blank line. Diagnostics go to stderr.
# Returns:
#   0 on success; 1 if no lexicon matched ../tsv/*tsv or a directory
#   contained no tsv.gz dictionaries.
#######################################
predict_without_english() {
  local -a targets=(de cs fr pt it nl)
  local -a lexicons=() dict_files=()
  local path status=0

  # Glob directly instead of parsing `ls`, so odd file names stay intact.
  for path in ../tsv/*tsv; do
    [[ -e "$path" ]] || continue # unmatched glob stays literal
    case "$path" in
      *ted* | *arabic* | *bangla* | *discmar* | *pdtb*) continue ;;
    esac
    lexicons+=("$path")
  done
  if ((${#lexicons[@]} == 0)); then
    echo "${0##*/}: no usable lexicon matched ../tsv/*tsv" >&2
    return 1
  fi

  # DICTS is expanded unquoted on purpose: it may list several directories.
  for DICT in $DICTS; do
    # The header used to print the unset $tgt; print the real target list.
    echo "${targets[*]} $DICT, no English, no DiscMar PDTB2/3 4 sense"

    dict_files=()
    while IFS= read -r path; do
      dict_files+=("$path")
    done < <(find "$DICT" | grep -E 'tsv.gz')
    if ((${#dict_files[@]} == 0)); then
      echo "${0##*/}: no tsv.gz dictionaries found under $DICT" >&2
      status=1
      echo
      continue
    fi

    # Every continuation backslash is preceded by a space so that no
    # argument can fuse with the option on the following line.
    python3 induce-dimlex.py \
      --dimlex "${lexicons[@]}" \
      --dict "${dict_files[@]}" \
      --tgt "${targets[@]}" \
      --th_steps 20 \
      --max_senses 4 \
      --test_pivlangs 5 \
      --silent \
      | perl -pe 's/\./,/g; s/ +/\t/g;'
    echo
  done
  return "$status"
}

predict_without_english
# done
# w. English
# # for tgt in en de cs fr pt it nl ca es; do
# dimlex=`ls ../tsv/*tsv | grep -v 'ted' | grep -v arabic | grep -v bangla | grep -v discmar.en `;
# for DICT in $DICTS; do
# echo $tgt $DICT, incl. English PDTB, PDTB0 1 sense
# dicts=`find $DICT | egrep tsv.gz`
# python3 induce-dimlex.py \
# --dimlex $dimlex \
# --dict $dicts \
# --tgt en de cs fr pt it nl ca es \
# --th_steps 20 \
# --max_senses 1\
# --test_pivlangs 8 \
# --silent | \
# perl -pe 's/\./,/g; s/ +/\t/g;'
# echo
# done
# # done
# # for tgt in en de cs fr pt it nl ca es; do
# dimlex=`ls ../tsv/*tsv | grep -v 'ted' | grep -v arabic | grep -v bangla | grep -v discmar.en `;
# for DICT in $DICTS; do
# echo $tgt $DICT, incl. English PDTB, PDTB1 2 senses
# dicts=`find $DICT | egrep tsv.gz`
# python3 induce-dimlex.py \
# --dimlex $dimlex \
# --dict $dicts \
# --tgt en de cs fr pt it nl ca es \
# --th_steps 20 \
# --max_senses 2\
# --test_pivlangs 8 \
# --silent | \
# perl -pe 's/\./,/g; s/ +/\t/g;'
# echo
# done
# # done
#######################################
# Run induce-dimlex.py including English (PDTB lexicons are kept):
# lexicons whose path contains ted, arabic, bangla or discmar are left
# out, max. 4 senses, 6 test pivot languages.
# The former per-target loop (for tgt in en de cs fr pt it nl) is disabled;
# all targets are handed to a single induce-dimlex.py call instead.
# Globals:
#   DICTS (read)    whitespace-separated list of dictionary directories
#   DICT  (written) directory currently being processed
# Arguments:
#   None
# Outputs:
#   Per directory: one header line, the induce-dimlex.py output with every
#   '.' replaced by ',' and every run of spaces replaced by a tab, then a
#   blank line. Diagnostics go to stderr.
# Returns:
#   0 on success; 1 if no lexicon matched ../tsv/*tsv or a directory
#   contained no tsv.gz dictionaries.
#######################################
predict_with_english() {
  local -a targets=(en de cs fr pt it nl)
  local -a lexicons=() dict_files=()
  local path status=0

  # Glob directly instead of parsing `ls`, so odd file names stay intact.
  for path in ../tsv/*tsv; do
    [[ -e "$path" ]] || continue # unmatched glob stays literal
    case "$path" in
      *ted* | *arabic* | *bangla* | *discmar*) continue ;;
    esac
    lexicons+=("$path")
  done
  if ((${#lexicons[@]} == 0)); then
    echo "${0##*/}: no usable lexicon matched ../tsv/*tsv" >&2
    return 1
  fi

  # DICTS is expanded unquoted on purpose: it may list several directories.
  for DICT in $DICTS; do
    # The header used to print the unset $tgt; print the real target list.
    echo "${targets[*]} $DICT, incl. English PDTB, no DiscMar PDTB2/3 4 senses"

    dict_files=()
    while IFS= read -r path; do
      dict_files+=("$path")
    done < <(find "$DICT" | grep -E 'tsv.gz')
    if ((${#dict_files[@]} == 0)); then
      echo "${0##*/}: no tsv.gz dictionaries found under $DICT" >&2
      status=1
      echo
      continue
    fi

    # Every continuation backslash is preceded by a space so that no
    # argument can fuse with the option on the following line.
    python3 induce-dimlex.py \
      --dimlex "${lexicons[@]}" \
      --dict "${dict_files[@]}" \
      --tgt "${targets[@]}" \
      --th_steps 20 \
      --max_senses 4 \
      --test_pivlangs 6 \
      --silent \
      | perl -pe 's/\./,/g; s/ +/\t/g;'
    echo
  done
  return "$status"
}

predict_with_english
# done