Spaces:

chompionsawelo
/

whisper_transcribe

Runtime error

chompionsawelo committed on Aug 16, 2023

Commit

77070f9

1 Parent(s): 1c1c8cf

minor fixes

Files changed (3) hide show

diarization.py CHANGED Viewed

@@ -1,6 +1,6 @@
 from pyannote.audio import Pipeline
 from pydub import AudioSegment
-import file_name
 import torch
 import json
 import gc
@@ -52,7 +52,7 @@ def audio_segmentation(input_file, speaker_groups_dict):
 def save_groups_json(sample_groups_list: list, speaker_groups_dict: dict):
-    with open(file_name.sample_groups_json, "w", encoding="utf-8") as json_file_sample:
         json.dump(sample_groups_list, json_file_sample)
-    with open(file_name.speaker_groups_json, "w", encoding="utf-8") as json_file_speaker:
         json.dump(speaker_groups_dict, json_file_speaker)

 from pyannote.audio import Pipeline
 from pydub import AudioSegment
+from file_name import *
 import torch
 import json
 import gc
 def save_groups_json(sample_groups_list: list, speaker_groups_dict: dict):
+    with open(get_sample_groups_json(), "w", encoding="utf-8") as json_file_sample:
         json.dump(sample_groups_list, json_file_sample)
+    with open(get_speaker_groups_json(), "w", encoding="utf-8") as json_file_speaker:
         json.dump(speaker_groups_dict, json_file_speaker)

file_name.py CHANGED Viewed

@@ -34,8 +34,13 @@ def get_video_subtitle_file():
     return f"{current_working_directory}/output_{get_title()}.mp4"
 start_time_for_adjustment = "00:00:00"
 end_time_for_adjustment = "01:00:00"
-sample_groups_json = "sample_groups.json"
-speaker_groups_json = "speaker_groups.json"

     return f"{current_working_directory}/output_{get_title()}.mp4"
+def get_sample_groups_json():
+    return f"{current_working_directory}/sample_groups_{get_title()}.json"
+def get_speaker_groups_json():
+    return f"{current_working_directory}/speaker_groups_{get_title()}.json"
 start_time_for_adjustment = "00:00:00"
 end_time_for_adjustment = "01:00:00"

utils.py CHANGED Viewed

@@ -4,14 +4,14 @@ import os
 def load_groups_json():
-    sample_groups_list = []
-    speaker_groups_dict = []
-    if os.path.exists(sample_groups_json):
-        with open(sample_groups_json, "r", encoding="utf-8") as json_file_sample:
-            sample_groups_list: list = json.load(json_file_sample)
-    if os.path.exists(speaker_groups_json):
-        with open(speaker_groups_json, "r", encoding="utf-8") as json_file_speaker:
-            speaker_groups_dict: dict = json.load(json_file_speaker)
     return sample_groups_list, speaker_groups_dict
@@ -35,12 +35,12 @@ def read_transcribe_subtitle_file(adjustment: bool):
         transcribe = get_transcribe_adjusted_file()
         subtitle = get_subtitle_adjusted_file()
-    transcribe_txt_list = []
-    subtitle_txt_list = []
-    if os.path.exists(transcribe):
-        with open(transcribe, "r", encoding="utf-8") as file:
-            transcribe_txt_list = file.readlines()
-    if os.path.exists(subtitle):
-        with open(subtitle, "r", encoding="utf-8") as file:
-            subtitle_txt_list = file.readlines()
     return transcribe_txt_list, subtitle_txt_list

 def load_groups_json():
+    if not os.path.exists(get_sample_groups_json()) or not os.path.exists(get_speaker_groups_json()):
+        print("JSON file doesn't exist")
+        return [], {}
+    with open(get_sample_groups_json(), "r", encoding="utf-8") as json_file_sample:
+        sample_groups_list: list = json.load(json_file_sample)
+    with open(get_speaker_groups_json(), "r", encoding="utf-8") as json_file_speaker:
+        speaker_groups_dict: dict = json.load(json_file_speaker)
     return sample_groups_list, speaker_groups_dict
         transcribe = get_transcribe_adjusted_file()
         subtitle = get_subtitle_adjusted_file()
+    if not os.path.exists(transcribe) or not os.path.exists(subtitle):
+        print("Transcribe or subtitle file doesn't exist")
+        return [], []
+    with open(transcribe, "r", encoding="utf-8") as file:
+        transcribe_txt_list = file.readlines()
+    with open(subtitle, "r", encoding="utf-8") as file:
+        subtitle_txt_list = file.readlines()
     return transcribe_txt_list, subtitle_txt_list