Migrate to WhisperX for speaker diarization

Implement a sliding window audio buffer and update the transcriber to
use WhisperX for transcription, alignment, and speaker identification.
Update the pipeline to handle and store speaker-attributed transcripts.

Additionally, rename the LLM processor's reasoning flag in `extra_body`
from "include_reasoning" to "enable_thinking".
This commit is contained in:
2026-05-26 21:48:30 -07:00
parent d0fcdfab01
commit f4c98fb2b9
7 changed files with 135 additions and 38 deletions
+2 -2
View File
@@ -83,7 +83,7 @@ class LLMProcessor:
model=self.model,
messages=messages,
response_format=response_format,
-extra_body={"include_reasoning": False},
+extra_body={"enable_thinking": False},
)
return response.choices[0].message.content
except Exception as e:
@@ -125,7 +125,7 @@ class LLMProcessor:
model=self.model,
messages=messages,
response_format={"type": "json_object"},
-extra_body={"include_reasoning": False},
+extra_body={"enable_thinking": False},
)
logger.info("LLM Processor (Extract): Response received from backend.")