#!/bin/bash
#
#SBATCH --mail-user=andrew.dyer.6854@student.uu.se
#SBATCH --mail-type=ALL
#
# Job name:
#SBATCH --job-name=mapping_supervised
#
# Project:
#SBATCH --account=nn9447k
#
# Wall clock limit:
#SBATCH --time=02:00:00
#
# Max memory usage per CPU (in MB):
#SBATCH --mem-per-cpu=20000
#
#qlogin --account=nn9447k  --partition=accel --gres=gpu:1

#
## Set up job environment:
module purge   # clear any inherited modules
set -o errexit # exit on errors

# Print an error message on stderr and abort the job.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# Fixed locations on the cluster. The names USER and LANG are deliberately
# not reused for these: both are standard environment variables (login name
# and locale) that are normally exported, so assigning a path or a language
# name to them would hand bogus values to every child process, including the
# Python run below.
user_root=/usit/abel/u1/andidyer
VENV=$user_root/.local/share/virtualenvs/Synthetic-PRwNTqdM
emb_root=$user_root/nobackup/facebook_embeddings
out_root=$user_root/output_embeddings_semi-supervised

## Positional arguments
#   $1  target-language directory name under $emb_root (required)
#   $2  training dictionary; passed to map_embeddings.py right after $3
#   $3  supervision option(s) for map_embeddings.py
tgt_lang=${1:-}
TRAINDICT=${2:-}
SUPERVISION=${3:-}
[[ -n "$tgt_lang" ]] || die "usage: sbatch <this script> LANGUAGE TRAINDICT SUPERVISION"

## Run command
# Same behaviour as the original unquoted `cd $scratch`: change to $scratch
# when it is set, otherwise to $HOME.
# NOTE(review): nothing visible in this script sets lowercase `scratch`;
# confirm whether the cluster's scratch-directory variable was intended.
cd "${scratch:-$HOME}"

# Locate the target embedding: the single entry in the language directory
# whose name contains "normed". A glob is used instead of parsing `ls`, and
# zero or multiple matches abort with a clear message instead of producing a
# broken path.
shopt -s nullglob
normed_files=("$emb_root/$tgt_lang"/*normed*)
shopt -u nullglob
case ${#normed_files[@]} in
  1) ;;
  0) die "no 'normed' embedding file found in $emb_root/$tgt_lang" ;;
  *) die "expected exactly one 'normed' file in $emb_root/$tgt_lang, found ${#normed_files[@]}" ;;
esac
TGT_EMB=${normed_files[0]##*/}
src_id=en
tgt_id=${TGT_EMB%%.vec*}   # file name up to (not including) the first ".vec"

# Create the per-language output directory (and any missing parents).
out_dir=$out_root/$tgt_lang
mkdir -p "$out_dir"

source "$VENV/bin/activate"

# Supervision option(s) followed by the dictionary path. $SUPERVISION is split
# on whitespace on purpose so that it can carry more than one option; an empty
# dictionary argument is dropped rather than passed as an empty string.
# shellcheck disable=SC2206
mode_args=($SUPERVISION)
if [[ -n "$TRAINDICT" ]]; then
  mode_args+=("$TRAINDICT")
fi

# NOTE(review): --cuda is passed, but the #SBATCH header requests no GPU (the
# qlogin line that does is commented out); confirm the partition/gres is
# supplied at submit time.
# NOTE(review): the trailing backslash after --cuda is kept from the original
# in case further options follow; drop it if --cuda is the last argument.
python ~/vecmap/map_embeddings.py \
  "${mode_args[@]}" \
  "$emb_root/English/en.vectors.normed.txt" \
  "$emb_root/$tgt_lang/$TGT_EMB" \
  "$out_dir/${src_id}-${tgt_id}_$src_id.txt" \
  "$out_dir/${src_id}-${tgt_id}_$tgt_id.txt" \
  --batch_size 512 \
  --vocabulary_cutoff 1000 \
  --verbose \
  --cuda \