all-in-one

Sleeping

helloWorld199 committed on Jun 15, 2024

Commit

9f42652

verified ·

1 Parent(s): 703fb58

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -188,8 +188,9 @@ def add_voice_labelv2(json_file, audio_path):
         speech_prob = model(chunk, SAMPLING_RATE).item()
         speech_probs.append(speech_prob)
     vad_iterator.reset_states() # reset model states after each audio
     voice_idxs = np.where(np.array(speech_probs) >= 0.7)
     if len(voice_idxs) == 0:
         print("NO VOICE SEGMENTS DETECTED!")
     try:
@@ -202,7 +203,7 @@ def add_voice_labelv2(json_file, audio_path):
                 begin_seq = False
             if voice_idxs[i+1] == voice_idxs[i]+1:
                 continue
             start_time = float((start_idx*window_size_samples)/SAMPLING_RATE)
             end_time = float((voice_idxs[i]*window_size_samples)/SAMPLING_RATE)
@@ -210,7 +211,8 @@ def add_voice_labelv2(json_file, audio_path):
             end_minutes = int(end_time)
             start_seconds = (start_time - start_minutes) * 60
             end_seconds = (end_time - end_minutes) * 60
             data['vocal_times'] = {
             "start_time": f"{start_minutes}.{start_seconds:.2f}",
             "end_time": f"{end_minutes}.{end_seconds:.2f}"
@@ -224,6 +226,7 @@ def add_voice_labelv2(json_file, audio_path):
         print(f"An exception occurred: {e}")
     with open(json_file, 'w') as f:
         json.dump(data, f, indent=4)
 with gr.Blocks() as demo:

         speech_prob = model(chunk, SAMPLING_RATE).item()
         speech_probs.append(speech_prob)
     vad_iterator.reset_states() # reset model states after each audio
     voice_idxs = np.where(np.array(speech_probs) >= 0.7)
+    print(len(np.where(np.array(speech_probs) >= 0.7))
     if len(voice_idxs) == 0:
         print("NO VOICE SEGMENTS DETECTED!")
     try:
                 begin_seq = False
             if voice_idxs[i+1] == voice_idxs[i]+1:
                 continue
             start_time = float((start_idx*window_size_samples)/SAMPLING_RATE)
             end_time = float((voice_idxs[i]*window_size_samples)/SAMPLING_RATE)
             end_minutes = int(end_time)
             start_seconds = (start_time - start_minutes) * 60
             end_seconds = (end_time - end_minutes) * 60
+            print("modifying json data... \n")
             data['vocal_times'] = {
             "start_time": f"{start_minutes}.{start_seconds:.2f}",
             "end_time": f"{end_minutes}.{end_seconds:.2f}"
         print(f"An exception occurred: {e}")
     with open(json_file, 'w') as f:
+        print("writing_to_json...")
         json.dump(data, f, indent=4)
 with gr.Blocks() as demo: