Spaces:

GreenRaptor
/

MMS

Runtime error

App Files Files Community

MMS / mms_infer.py

GreenRaptor

Update mms_infer.py

3533765 over 2 years ago

raw

history blame contribute delete

2.33 kB

	#!/usr/bin/env python -u
	# Copyright (c) Facebook, Inc. and its affiliates.
	#
	# This source code is licensed under the MIT license found in the
	# LICENSE file in the root directory of this source tree.

	import argparse
	import soundfile as sf
	import tempfile
	from pathlib import Path
	import os
	import subprocess
	import sys
	import re

	def parser():
	parser = argparse.ArgumentParser(description="ASR inference script for MMS model")
	parser.add_argument("--model", type=str, help="path to ASR model", required=True)
	parser.add_argument("--audio", type=str, help="path to audio file", required=True, nargs='+')
	parser.add_argument("--lang", type=str, help="audio language", required=True)
	parser.add_argument("--format", type=str, choices=["none", "letter"], default="letter")
	return parser.parse_args()

	def process(args):
	with tempfile.TemporaryDirectory() as tmpdir:
	print(">>> preparing tmp manifest dir ...", file=sys.stderr)
	tmpdir = Path(tmpdir)
	with open(tmpdir / "dev.tsv", "w") as fw:
	fw.write("/\n")
	for audio in args.audio:
	nsample = sf.SoundFile(audio).frames
	fw.write(f"{audio}\t{nsample}\n")
	with open(tmpdir / "dev.uid", "w") as fw:
	fw.write(f"{audio}\n"*len(args.audio))
	with open(tmpdir / "dev.ltr", "w") as fw:
	fw.write("d u m m y \| d u m m y\n"*len(args.audio))
	with open(tmpdir / "dev.wrd", "w") as fw:
	fw.write("dummy dummy\n"*len(args.audio))
	cmd = f"""
	PYTHONPATH=. PREFIX=INFER HYDRA_FULL_ERROR=1 python infer.py -m decoding.type=viterbi dataset.max_tokens=4000000 distributed_training.distributed_world_size=1 "common_eval.path='{args.model}'" task.data={tmpdir} dataset.gen_subset="{args.lang}:dev" common_eval.post_process={args.format} decoding.results_path={tmpdir}
	"""
	print(">>> loading model & running inference ...", file=sys.stderr)
	subprocess.run(cmd, shell=True, stdout=subprocess.DEVNULL,)
	with open(tmpdir/"hypo.word") as fr:
	for ii, hypo in enumerate(fr):
	hypo = re.sub("$\S+$$", "", hypo).strip()
	print(f'===============\nInput: {args.audio[ii]}\nOutput: {hypo}')


	if __name__ == "__main__":
	args = parser()
	process(args)