Spaces:
				
			
			
	
			
			
		Running
		
			on 
			
			Zero
	
	
	
			
			
	
	
	
	
		
		
		Running
		
			on 
			
			Zero
	Update app.py
Browse files
    	
        app.py
    CHANGED
    
    | @@ -27,6 +27,7 @@ from infer.utils_infer import ( | |
| 27 | 
             
                remove_silence_for_generated_wav,
         | 
| 28 | 
             
                save_spectrogram,
         | 
| 29 | 
             
            )
         | 
|  | |
| 30 | 
             
            from transformers import pipeline
         | 
| 31 | 
             
            import click
         | 
| 32 | 
             
            import soundfile as sf
         | 
| @@ -245,7 +246,11 @@ def infer_batch(ref_audio, ref_text, gen_text_batches, exp_name, remove_silence, | |
| 245 | 
             
                for i, gen_text in enumerate(progress.tqdm(gen_text_batches)):
         | 
| 246 | 
             
                    # Prepare the text
         | 
| 247 | 
             
                    text_list = [ref_text + gen_text]
         | 
| 248 | 
            -
                     | 
|  | |
|  | |
|  | |
|  | |
| 249 |  | 
| 250 | 
             
                    # Calculate reference audio length
         | 
| 251 | 
             
                    ref_audio_len = audio.shape[-1] // hop_length
         | 
|  | |
| 27 | 
             
                remove_silence_for_generated_wav,
         | 
| 28 | 
             
                save_spectrogram,
         | 
| 29 | 
             
            )
         | 
| 30 | 
            +
            from tokenizers import Tokenizer
         | 
| 31 | 
             
            from transformers import pipeline
         | 
| 32 | 
             
            import click
         | 
| 33 | 
             
            import soundfile as sf
         | 
|  | |
| 246 | 
             
                for i, gen_text in enumerate(progress.tqdm(gen_text_batches)):
         | 
| 247 | 
             
                    # Prepare the text
         | 
| 248 | 
             
                    text_list = [ref_text + gen_text]
         | 
| 249 | 
            +
                    encoding = tokenizer.encode(text_list)
         | 
| 250 | 
            +
                    tokens = encoding.tokens
         | 
| 251 | 
            +
                    text_list = ' '.join(map(str, tokens))
         | 
| 252 | 
            +
             | 
| 253 | 
            +
                    final_text_list = [text_list]
         | 
| 254 |  | 
| 255 | 
             
                    # Calculate reference audio length
         | 
| 256 | 
             
                    ref_audio_len = audio.shape[-1] // hop_length
         |