adding post processing

tim-roethig-db · May 25, 2024 · 40caa99 · 40caa99
1 parent 2dc854c
commit 40caa99
Show file tree

Hide file tree

Showing 3 changed files with 27 additions and 1 deletion.
diff --git a/amondin/post_processing.py b/amondin/post_processing.py
@@ -0,0 +1,23 @@
+import pandas as pd
+
+
+def merge_rows_consecutive_speaker(transcript: pd.DataFrame) -> pd.DataFrame:
+    """Merge runs of consecutive rows spoken by the same speaker into one row.
+
+    Rows are grouped by uninterrupted runs of equal ``speaker`` values, so a
+    speaker who talks again after somebody else yields a separate row. The
+    ``text`` of each run is joined with single spaces. Timing columns are
+    merged when present: ``time_stamp`` strings are joined with single spaces,
+    while ``start`` / ``end`` collapse to the earliest start and the latest
+    end of the run.
+
+    The input frame is left untouched. Columns other than ``speaker``, the
+    timing columns and ``text`` are not carried over.
+
+    Args:
+        transcript: One row per passage, with at least the columns
+            ``speaker`` and ``text``.
+
+    Returns:
+        A new DataFrame with one row per speaker run, in the original order.
+    """
+    # A new run starts wherever the speaker differs from the previous row;
+    # the cumulative sum turns those change points into a run id. The id is
+    # kept as a standalone Series so the caller's frame is not modified.
+    speaker_group = (
+        transcript['speaker'] != transcript['speaker'].shift()
+    ).cumsum().rename('speaker_group')
+
+    # Only aggregate the timing columns that actually exist, so both the
+    # string 'time_stamp' layout and the numeric 'start'/'end' layout work.
+    aggregations = {}
+    if 'time_stamp' in transcript.columns:
+        aggregations['time_stamp'] = ' '.join
+    if 'start' in transcript.columns:
+        aggregations['start'] = 'min'
+    if 'end' in transcript.columns:
+        aggregations['end'] = 'max'
+    aggregations['text'] = ' '.join
+
+    # Run ids are already increasing, so sort=False keeps the original order.
+    merged = (
+        transcript.groupby([speaker_group, 'speaker'], sort=False)
+        .agg(aggregations)
+        .reset_index()
+    )
+
+    return merged.drop(columns='speaker_group')
+
+
+if __name__ == "__main__":
+    # Manual smoke test: merge the sample transcript and show the result.
+    from pathlib import Path
+
+    # Resolve the sample relative to this file so the script does not depend
+    # on the current working directory.
+    sample_path = (
+        Path(__file__).resolve().parent.parent / "data" / "test_transcript.xlsx"
+    )
+    test_transcript = pd.read_excel(sample_path)
+    print(merge_rows_consecutive_speaker(transcript=test_transcript))
diff --git a/amondin/segment_speakers.py b/amondin/segment_speakers.py
@@ -65,12 +65,14 @@ def segment_speakers(
             # craft dict representing passage
             segment = {
                 "speaker": list(speaker)[0],
-                "time_stamp": str(segment),
+                "start": segment.start,
+                "end": segment.end,
                 "audio": {
                     "raw": waveform,
                     "sampling_rate": sample_rate,
                 },
             }
+            print(segment)
 
             speaker_segments.append(segment)
 

diff --git a/setup.py b/setup.py
@@ -16,5 +16,6 @@
         "numpy",
         "torch",
         "torchaudio",
+        "openpyxl",
     ]
 )