#!/usr/bin/env sh
# Copyright (c) 2018-present, Facebook, Inc.
# All rights reserved.
#
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.
#
# Example pipeline: download bilingual dictionaries and word embeddings for a
# language pair, run align.py on them, then run eval.py on the result.
#
# Usage: sh <this-script> [SRC_LANG] [TGT_LANG]
#   SRC_LANG  source language code (default: en)
#   TGT_LANG  target language code (default: es)
#
# Files are downloaded into ./data (skipped when already present) and the
# output of align.py is written to ./res/wiki.SRC-TGT.vec.
# Requires wget and python3 on PATH, and align.py / eval.py in the current
# working directory.

# Abort on the first failing command and on any use of an unset variable.
set -eu

s=${1:-en}
t=${2:-es}
echo "Example based on the ${s}->${t} alignment"

# mkdir -p is a no-op for directories that already exist.
mkdir -p data res

#######################################
# Download a file into data/ unless it already exists locally.
# Arguments:
#   $1 - local path of the file (its final path component is the remote name)
#   $2 - base URL under which the remote file lives (no trailing slash)
# Returns:
#   0 when the file is present or wget succeeded; wget's status otherwise
#   (which aborts the script because of `set -e`).
#######################################
fetch_if_missing() {
  if [ ! -f "$1" ]; then
    # ${1##*/} strips everything up to the last '/', i.e. the file's basename.
    # -c lets wget resume a partially downloaded file.
    wget -c "$2/${1##*/}" -P data/
  fi
}

dico_url=https://s3.amazonaws.com/arrival/dictionaries
emb_url=https://s3-us-west-1.amazonaws.com/fasttext-vectors

dico_train=data/${s}-${t}.0-5000.txt
dico_test=data/${s}-${t}.5000-6500.txt
src_emb=data/wiki.${s}.vec
tgt_emb=data/wiki.${t}.vec

fetch_if_missing "${dico_train}" "${dico_url}"
fetch_if_missing "${dico_test}" "${dico_url}"
fetch_if_missing "${src_emb}" "${emb_url}"
fetch_if_missing "${tgt_emb}" "${emb_url}"

output=res/wiki.${s}-${t}.vec

python3 align.py --src_emb "${src_emb}" --tgt_emb "${tgt_emb}" \
  --dico_train "${dico_train}" --dico_test "${dico_test}" --output "${output}" \
  --lr 25 --niter 10

# Evaluate using the file written by align.py as the source embeddings.
python3 eval.py --src_emb "${output}" --tgt_emb "${tgt_emb}" \
  --dico_test "${dico_test}"