diff --git a/packages/transcription/README.md b/packages/transcription/README.md
index 245ffa1ee311..53d291091698 100644
--- a/packages/transcription/README.md
+++ b/packages/transcription/README.md
@@ -17,8 +17,12 @@ Provide a common API to many transcription backend, currently :
 And at least one of the following transcription backend:
 - Python :
   - `openai-whisper`
-  - `whisper-ctranslate2`
-  - `whisper-timestamped`
+  - `whisper-ctranslate2>=0.4.3`
+  - `whisper-timestamped>=1.15.4`
+
+And to run the transcript evaluation tests :
+- Python
+  - `jiwer>=3.0.4`
 
 ## Usage
 
diff --git a/packages/transcription/src/transcript/transcript-file-evaluator.ts b/packages/transcription/src/transcript/transcript-file-evaluator.ts
index 1262cddaf615..bf41d1e046be 100644
--- a/packages/transcription/src/transcript/transcript-file-evaluator.ts
+++ b/packages/transcription/src/transcript/transcript-file-evaluator.ts
@@ -48,15 +48,10 @@ export class TranscriptFileEvaluator {
    * CER: Character Error Rate
    */
   async cer () {
-    // @see https://github.com/jitsi/jiwer/issues/87
-    let result = {
-      stdout: undefined
-    }
-    try {
-      result = await $`jiwer ${this.buildArgs('--cer', )}`
-    } catch {}
+    const { stdout: cer } = await $`jiwer ${this.buildArgs('--cer', '-g')}`
 
-    return result.stdout ? Number(result.stdout) : undefined
+    // stdout is text: convert it so callers keep receiving a number, as before this change
+    return Number(cer)
   }
 
   async alignement () {