Spaces:
				
			
			
	
			
			
		Runtime error
		
	
	
	
			
			
	
	
	
	
		
		
		Runtime error
		
	# Evaluate a baseline translation model on its benchmark test sets.
#
# Usage: bash <this-script> [src_lang] [tgt_lang] [bucket_path]
#   src_lang     source language code (default: hi)
#   tgt_lang     target language code (default: en)
#   bucket_path  GCS location of the baseline experiment
#                (default: derived from the language pair)
#
# Steps:
#   1. Download vocab/, final_bin/ and model/checkpoint_best.pt from the bucket
#      into ../baselines/baselines-<src>-<tgt>, unless that directory exists.
#   2. Choose the list of test sets for the language pair.
#   3. Run translate.sh (looked up in the current directory) on each test set.
#   4. Copy the results directory back to the bucket.
#
# NOTE(review): the benchmark files read from $expdir/benchmarks are not
# downloaded by this script - presumably they are provisioned separately;
# verify before relying on a fresh checkout.

src_lang=${1:-hi}
tgt_lang=${2:-en}
bucket_path=${3:-gs://ai4b-anuvaad-nmt/baselines/transformer-base/baselines-${src_lang}-${tgt_lang}}
expdir=../baselines/baselines-${src_lang}-${tgt_lang}

# Print a message to stderr and abort the script.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Download the baseline artifacts into $expdir unless it already exists.
# Globals: expdir (read), bucket_path (read)
fetch_baseline() {
  if [[ -d "$expdir" ]]; then
    echo "$expdir exists on your filesystem. Please delete this if you have made some changes to the bucket files and trying to redownload"
    return 0
  fi

  mkdir -p "$expdir/model" || die "cannot create $expdir/model"

  # All paths are relative to the current directory, so no 'cd' is needed.
  # The earlier 'cd ../baselines ... cd ../indicTrans' round trip resolved to
  # the same locations but broke when the checkout was not named 'indicTrans'.
  if ! gsutil -m cp -r "$bucket_path/vocab" "$expdir"; then
    die "failed to download vocab from $bucket_path; delete $expdir before retrying"
  fi
  if ! gsutil -m cp -r "$bucket_path/final_bin" "$expdir"; then
    die "failed to download final_bin from $bucket_path; delete $expdir before retrying"
  fi
  if ! gsutil -m cp "$bucket_path/model/checkpoint_best.pt" "$expdir/model"; then
    die "failed to download checkpoint_best.pt from $bucket_path; delete $expdir before retrying"
  fi
}

# Populate the global TEST_SETS array for the given language pair.
# Languages are tried in a fixed priority order; the first one equal to either
# side of the pair decides the list.
# Arguments: $1 - source language, $2 - target language
# Returns:   0 if a list was selected, 1 if neither language is known
select_test_sets() {
  local src=$1 tgt=$2 lang
  for lang in hi ta bn gu as kn ml mr or pa te; do
    if [[ "$src" != "$lang" && "$tgt" != "$lang" ]]; then
      continue
    fi
    case "$lang" in
      hi)
        # Fuller list kept for reference:
        # ( wmt-news wat2021-devtest wat2020-devtest anuvaad-legal tico19 sap-documentation-benchmark all )
        TEST_SETS=(wat2021-devtest wat2020-devtest wat-2018 wmt-news)
        ;;
      ta)
        # ( wmt-news wat2021-devtest wat2020-devtest anuvaad-legal tico19 all )
        TEST_SETS=(wat2021-devtest wat2020-devtest wat-2018 wmt-news ufal-ta)
        ;;
      bn)
        # ( wat2021-devtest wat2020-devtest anuvaad-legal tico19 all )
        TEST_SETS=(wat2021-devtest wat2020-devtest wat-2018)
        ;;
      gu)
        # ( wmt-news wat2021-devtest wat2020-devtest all )
        TEST_SETS=(wat2021-devtest wat2020-devtest wmt-news)
        ;;
      as)
        TEST_SETS=(pmi)
        ;;
      kn)
        # ( wat2021-devtest anuvaad-legal all )
        TEST_SETS=(wat2021-devtest)
        ;;
      ml)
        # ( wat2021-devtest wat2020-devtest anuvaad-legal all )
        TEST_SETS=(wat2021-devtest wat2020-devtest wat-2018)
        ;;
      mr)
        # ( wat2021-devtest wat2020-devtest all )
        TEST_SETS=(wat2021-devtest wat2020-devtest)
        ;;
      or | pa)
        TEST_SETS=(wat2021-devtest)
        ;;
      te)
        # ( wat2021-devtest wat2020-devtest anuvaad-legal all )
        TEST_SETS=(wat2021-devtest wat2020-devtest wat-2018)
        ;;
    esac
    return 0
  done
  return 1
}

fetch_baseline

TEST_SETS=()
select_test_sets "$src_lang" "$tgt_lang" \
  || die "no test sets are defined for language pair ${src_lang}-${tgt_lang}"

# Benchmark sub-directories are named en-<lang>, using the non-English side.
if [[ "$src_lang" == 'en' ]]; then
  indic_lang=$tgt_lang
else
  indic_lang=$src_lang
fi

for tset in "${TEST_SETS[@]}"; do
  echo "$tset $src_lang $tgt_lang"

  # wat2021-devtest keeps its test files directly in the test-set directory;
  # every other test set nests them under en-<indic_lang>/.
  if [[ "$tset" == 'wat2021-devtest' ]]; then
    bench_dir=${expdir}/benchmarks/$tset
  else
    bench_dir=${expdir}/benchmarks/$tset/en-${indic_lang}
  fi
  SRC_FILE=$bench_dir/test.$src_lang
  REF_FILE=$bench_dir/test.$tgt_lang

  RESULTS_DIR=${expdir}/results/$tset
  mkdir -p "$RESULTS_DIR"

  # Best effort: a failure on one test set is reported, but the remaining
  # test sets are still evaluated.
  bash translate.sh "$SRC_FILE" "$RESULTS_DIR/${src_lang}-${tgt_lang}" \
    "$src_lang" "$tgt_lang" "$expdir" "$REF_FILE" \
    || printf 'warning: translate.sh failed for %s\n' "$tset" >&2

  # for newline between different outputs
  echo
done

# send the results to the bucket
gsutil -m cp -r "$expdir/results" "$bucket_path"

# clear up the space in the instance
# rm -r $expdir
