Skip to content

Commit

Permalink
adding min and max speaker support
Browse files: browse the repository at this point in the history
  • Loading branch information
tim-roethig-db committed May 25, 2024
1 parent 91d355a commit 3f7e105
Showing 1 changed file with 17 additions and 16 deletions.
33 changes: 17 additions & 16 deletions amondin/segment_speakers.py
Original file line number | Diff line number | Diff line change
@@ -53,24 +53,25 @@ def segment_speakers(
speaker_segments = []
for segment in segments:
print(segment.duration)
# get audio passages as numpy array
waveform, sample_rate = Audio().crop(audio, segment, mode="pad")
waveform = torch.squeeze(waveform)
waveform = waveform.numpy()
if segment.duration > 0.05:
# get audio passages as numpy array
waveform, sample_rate = Audio().crop(audio, segment, mode="pad")
waveform = torch.squeeze(waveform)
waveform = waveform.numpy()

# get speaker belonging to audio
speaker = annotation.get_labels(segment)
# get speaker belonging to audio
speaker = annotation.get_labels(segment)

# craft dict representing passage
segment = {
"speaker": list(speaker)[0],
"time_stamp": str(segment),
"audio": {
"raw": waveform,
"sampling_rate": sample_rate,
},
}
# craft dict representing passage
segment = {
"speaker": list(speaker)[0],
"time_stamp": str(segment),
"audio": {
"raw": waveform,
"sampling_rate": sample_rate,
},
}

speaker_segments.append(segment)
speaker_segments.append(segment)

return speaker_segments

0 comments on commit 3f7e105

Please sign in to comment.