LAP-DEV committed on
Commit
6f8989f
·
verified ·
1 Parent(s): 8e1fa57

Update modules/utils/subtitle_manager.py

Browse files
Files changed (1) hide show
  1. modules/utils/subtitle_manager.py +8 -11
modules/utils/subtitle_manager.py CHANGED
@@ -44,18 +44,15 @@ def get_srt(segments):
44
  def get_csv(segments):
45
  bDiarization = False
46
  output = ""
47
-
48
- for i, segment in enumerate(segments):
49
- if segment['text'].startswith(' '):
50
- segment['text'] = segment['text'][1:]
51
 
52
- # Check if speakers are identified and get speaker id & text
53
- temp = re.search(r'_[0-9][0-9]: ',segment['text'])
54
-
55
- if temp != None:
56
- #temp_string = str(temp.group())
57
- #speaker_id = temp_string.replace(': ','')
58
- #speaker_text = (segment['text']).replace(temp_string,'')
 
59
  speaker_id = ((segment['text']).split(":", 1)[0]).strip()
60
  speaker_text = ((segment['text']).split(":", 1)[1]).strip()
61
  output += f"{i + 1};{timeformat_srt(segment['start'])};{timeformat_srt(segment['end'])};{speaker_id};{speaker_text};\n"
 
44
  def get_csv(segments):
45
  bDiarization = False
46
  output = ""
 
 
 
 
47
 
48
+ # Check if speakers are identified
49
+ for segment in enumerate(segments):
50
+ if re.search(r'_[0-9][0-9]: ',segment['text']) != None:
51
+ bDiarization = True
52
+ break
53
+
54
+ for i, segment in enumerate(segments):
55
+ if bDiarization:
56
  speaker_id = ((segment['text']).split(":", 1)[0]).strip()
57
  speaker_text = ((segment['text']).split(":", 1)[1]).strip()
58
  output += f"{i + 1};{timeformat_srt(segment['start'])};{timeformat_srt(segment['end'])};{speaker_id};{speaker_text};\n"