in STT/faster_whisper_handler.py [0:0]
def process(self, audio):
    """Transcribe ``audio`` with the faster-whisper model and yield the text.

    The module-level ``pipeline_start`` timestamp is reset to
    ``perf_counter()`` before transcription begins. The texts of all
    returned segments are joined with single spaces and stripped.

    Args:
        audio: Input passed straight through to ``self.model.transcribe``
            together with ``self.gen_kwargs``.

    Yields:
        The joined transcription, exactly once, and only when it is
        non-empty. When nothing was recognised the generator finishes
        without yielding.
    """
    logger.debug("infering faster whisper...")

    # Written to the module global so code outside this method can read
    # the moment transcription started.
    global pipeline_start
    pipeline_start = perf_counter()

    # The second element of the returned pair is not needed here.
    segments, _ = self.model.transcribe(audio, **self.gen_kwargs)

    output_text = []
    for segment in segments:
        # Pass values as logger arguments so the message is only formatted
        # when DEBUG logging is actually enabled.
        logger.debug(
            "[%.2fs -> %.2fs] %s", segment.start, segment.end, segment.text
        )
        output_text.append(segment.text)

    pred_text = " ".join(output_text).strip()
    logger.debug("finished whisper inference")

    if not pred_text:
        logger.debug("no text detected. skipping...")
        return

    console.print(f"[yellow]USER: {pred_text}")
    yield pred_text