diff --git a/whisperx/alignment.py b/whisperx/alignment.py index 09f044f4..e2c86f74 100644 --- a/whisperx/alignment.py +++ b/whisperx/alignment.py @@ -450,8 +450,8 @@ def get_raw_text(word_row): "end": srow["end"], "text": text, "words": word_list, - # "word-segments": wseg, - # "char-segments": cseg + "word-segments": wseg, + "char-segments": cseg } ) diff --git a/whisperx/transcribe.py b/whisperx/transcribe.py index fd6cf528..dab9e127 100644 --- a/whisperx/transcribe.py +++ b/whisperx/transcribe.py @@ -203,6 +203,12 @@ def cli(): # >> Write for result, audio_path in results: + # Remove pandas dataframes from result so that + # we can serialize the result with json + for seg in result["segments"]: + seg.pop("word-segments", None) + seg.pop("char-segments", None) + writer(result, audio_path, writer_args) if __name__ == "__main__":