Skip to content

Instantly share code, notes, and snippets.

@infinex
Created June 4, 2021 05:40
Show Gist options
  • Save infinex/5d5d2e517781a72600fcf43422cd4a20 to your computer and use it in GitHub Desktop.
Save infinex/5d5d2e517781a72600fcf43422cd4a20 to your computer and use it in GitHub Desktop.
makfile
# URL of the released-data index that the tatoeba-all-bt target downloads
# to enumerate language pairs.
TATOEBA_RELEASED_BT := https://object.pouta.csc.fi/Tatoeba-MT-bt/released-data.txt
## Print (without executing) the make commands for every language pair
## listed in ${TATOEBA_RELEASED_BT}: one "fetch-bt" call in bt-tatoeba and
## one "tatoeba-<trg>2<src>-train-bt.submitcpu" call per pair.
##
## The index is downloaded with wget when the recipe is expanded. Entries
## containing the literal string ".txt" are skipped (grep -F, so the dot is
## not a regex wildcard and a pair such as "eng-txt" is not dropped by
## accident). The part before the first '/' is taken as the pair name
## "<src>-<trg>".
.PHONY: tatoeba-all-bt
tatoeba-all-bt:
	for b in ${shell wget -qq -O - ${TATOEBA_RELEASED_BT} | grep -v -F '.txt' | cut -f1 -d'/' | sort -u}; do \
	  s=`echo "$$b" | cut -f1 -d'-'`; \
	  t=`echo "$$b" | cut -f2 -d'-'`; \
	  echo "${MAKE} -C bt-tatoeba SRC=$$s TRG=$$t fetch-bt"; \
	  echo "${MAKE} MODELTYPE=transformer-align HPC_CORES=2 HPC_MEM=32g tatoeba-$${t}2$${s}-train-bt.submitcpu"; \
	done
## generic target for tatoeba challenge jobs
##
## "make <goal>-tatoeba" re-invokes make on <goal> (the target name with
## the "-tatoeba" suffix removed), passing ${TATOEBA_PARAMS} plus:
##   LANGPAIRSTR, SRC, TRG - forwarded unchanged from this invocation
##   SRCLANGS / TRGLANGS   - contents of the first / second prerequisite
##                           (the source and target label files)
##   EMAIL                 - forced to empty for the sub-make
##
## $+ is used instead of $^ on purpose: $^ drops duplicate prerequisites,
## so if both label-file variables name the same file, ${word 2,$^} would
## be empty and "cat" would block reading stdin.
%-tatoeba: ${TATOEBA_SRCLABELFILE} ${TATOEBA_TRGLABELFILE}
	${MAKE} ${TATOEBA_PARAMS} \
		LANGPAIRSTR=${LANGPAIRSTR} \
		SRCLANGS="${shell cat ${word 1,$+}}" \
		TRGLANGS="${shell cat ${word 2,$+}}" \
		SRC=${SRC} TRG=${TRG} \
		EMAIL= \
		${@:-tatoeba=}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment