1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51
|
#!/bin/usr/env sh
# Copyright (c) 2018-present, Facebook, Inc.
# All rights reserved.
#
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.
set -e
s=${1:-en}
t=${2:-es}
echo "Example based on the ${s}->${t} alignment"
if [ ! -d data/ ]; then
mkdir -p data;
fi
if [ ! -d res/ ]; then
mkdir -p res;
fi
dico_train=data/${s}-${t}.0-5000.txt
if [ ! -f "${dico_train}" ]; then
DICO=$(basename -- "${dico_train}")
wget -c "https://dl.fbaipublicfiles.com/arrival/dictionaries/${DICO}" -P data/
fi
dico_test=data/${s}-${t}.5000-6500.txt
if [ ! -f "${dico_test}" ]; then
DICO=$(basename -- "${dico_test}")
wget -c "https://dl.fbaipublicfiles.com/arrival/dictionaries/${DICO}" -P data/
fi
src_emb=data/wiki.${s}.vec
if [ ! -f "${src_emb}" ]; then
EMB=$(basename -- "${src_emb}")
wget -c "https://dl.fbaipublicfiles.com/fasttext/vectors-wiki/${EMB}" -P data/
fi
tgt_emb=data/wiki.${t}.vec
if [ ! -f "${tgt_emb}" ]; then
EMB=$(basename -- "${tgt_emb}")
wget -c "https://dl.fbaipublicfiles.com/fasttext/vectors-wiki/${EMB}" -P data/
fi
output=res/wiki.${s}-${t}.vec
python3 align.py --src_emb "${src_emb}" --tgt_emb "${tgt_emb}" \
--dico_train "${dico_train}" --dico_test "${dico_test}" --output "${output}" \
--lr 25 --niter 10
python3 eval.py --src_emb "${output}" --tgt_emb "${tgt_emb}" \
--dico_test "${dico_test}"
|