forked from facebookresearch/MUSE
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfexample.sh
61 lines (50 loc) · 1.66 KB
/
fexample.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
#!/usr/bin/env sh
# Copyright (c) 2018-present, Facebook, Inc.
# All rights reserved.
#
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.
# Enter the MUSE checkout when the script is started from its parent
# directory. When there is no MUSE/ directory the script keeps working in the
# current directory, which is what the previously unchecked `cd` ended up
# doing as well.
if [ -d MUSE ]; then
  cd MUSE || exit 1
fi

#wget https://dl.fbaipublicfiles.com/arrival/vectors.tar.gz
#wget https://dl.fbaipublicfiles.com/arrival/dictionaries.tar.gz

# Download the wordsim archive and install its contents as data/monolingual.
# The whole step is skipped once data/monolingual exists: repeating it would
# make `mv` place wordsim/ *inside* the existing directory instead of renaming
# it. Every command is checked explicitly because `set -e` is only enabled
# further down in the script.
if [ ! -d ./data/monolingual ]; then
  # -c resumes a partial archive instead of saving a second copy next to it;
  # wget creates the ./data/ prefix directory if it does not exist yet.
  wget -c https://dl.fbaipublicfiles.com/arrival/wordsim.tar.gz -P ./data/ || exit 1
  tar -xzf ./data/wordsim.tar.gz -C ./data/ || exit 1
  # NOTE(review): assumes the archive unpacks to ./data/wordsim - confirm.
  mv ./data/wordsim ./data/monolingual || exit 1
fi
# From here on, stop at the first command that fails.
set -e

# Language pair: source is $1 (default "en"), target is $2 (default "hi").
s="${1:-en}"
t="${2:-hi}"
echo "Example based on the ${s}->${t} alignment"

# Working directories. `mkdir -p` succeeds silently when the directory is
# already there, so no separate existence test is needed.
mkdir -p data
mkdir -p res
# Download the dictionaries and embeddings for the ${s}->${t} pair into data/.

# fetch_if_missing DEST BASE_URL
#   Make sure DEST (a path directly under data/) exists, downloading
#   BASE_URL/<basename of DEST> when it does not.
#   The download is written to data/.incoming/ and moved to DEST only after
#   wget succeeds. An interrupted transfer therefore never leaves a truncated
#   file at DEST that the `-f` check would accept on the next run; `wget -c`
#   resumes the staged partial file instead.
#   Returns non-zero when the download or the final move fails.
fetch_if_missing() {
  if [ -f "$1" ]; then
    return 0
  fi
  # wget creates the data/.incoming/ prefix directory when it is missing.
  wget -c "$2/$(basename -- "$1")" -P data/.incoming/ || return 1
  mv -- "data/.incoming/$(basename -- "$1")" "$1"
}

dict_url=https://dl.fbaipublicfiles.com/arrival/dictionaries
emb_url=https://dl.fbaipublicfiles.com/fasttext/vectors-wiki

dico_train=data/${s}-${t}.0-5000.txt
dico_test=data/${s}-${t}.5000-6500.txt
src_emb=data/wiki.${s}.vec
tgt_emb=data/wiki.${t}.vec

# Calls are checked explicitly so a failed download stops the script even if
# `set -e` is not in effect.
fetch_if_missing "${dico_train}" "${dict_url}" || exit 1
fetch_if_missing "${dico_test}" "${dict_url}" || exit 1
fetch_if_missing "${src_emb}" "${emb_url}" || exit 1
fetch_if_missing "${tgt_emb}" "${emb_url}" || exit 1

# Best effort: drop the staging directory once it is empty. Failure (missing
# or non-empty directory) is deliberately ignored.
rmdir data/.incoming 2>/dev/null || :
#output=res/wiki.${s}-${t}.vec
#
#python3 align.py --src_emb "${src_emb}" --tgt_emb "${tgt_emb}" \
# --dico_train "${dico_train}" --dico_test "${dico_test}" --output "${output}" \
# --lr 25 --niter 10
#python3 eval.py --src_emb "${output}" --tgt_emb "${tgt_emb}" \
# --dico_test "${dico_test}"
#