
Commit

Merge pull request #8 from nextcloud/feat/compute-device
feat: detect computation device for Whisper model
marcelklehr authored Oct 30, 2024
2 parents 13f70af + 3495e5c commit 4ca8f89
Showing 2 changed files with 15 additions and 4 deletions.
2 changes: 1 addition & 1 deletion Dockerfile
@@ -1,4 +1,4 @@
-FROM nvidia/cuda:11.8.0-cudnn8-runtime-ubuntu22.04
+FROM nvidia/cuda:12.2.2-cudnn8-devel-ubuntu22.04

 RUN \
 apt update && \
17 changes: 14 additions & 3 deletions lib/main.py
@@ -10,9 +10,16 @@
 import os

 from fastapi import Depends, FastAPI, UploadFile, responses
-from nc_py_api import AsyncNextcloudApp, NextcloudApp
-from nc_py_api.ex_app import LogLvl, anc_app, run_app, set_handlers, persistent_storage
 from faster_whisper import WhisperModel
+from nc_py_api import AsyncNextcloudApp, NextcloudApp
+from nc_py_api.ex_app import (
+    anc_app,
+    get_computation_device,
+    LogLvl,
+    persistent_storage,
+    run_app,
+    set_handlers,
+)


 def load_models():
@@ -28,7 +35,11 @@ def load_models():
     return models

 def create_model_loader(file_path):
-    return lambda: WhisperModel(file_path, device="cpu")
+    device = get_computation_device().lower()
+    if device != "cuda": # other GPUs are currently not supported by Whisper
+        device = "cpu"
+
+    return lambda: WhisperModel(file_path, device=device)


 models = load_models()
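For illustration, a minimal standalone sketch of the device-selection pattern this commit introduces: ask nc_py_api's ex-app helper which computation device is configured and fall back to CPU for anything that is not a CUDA GPU, since faster-whisper supports no other accelerators. The sketch assumes it runs inside a Nextcloud ExApp environment (so get_computation_device() can report a device); the model path and the eager load at the end are hypothetical, whereas the real app builds such loaders inside load_models().

from faster_whisper import WhisperModel
from nc_py_api.ex_app import get_computation_device


def pick_device():
    # get_computation_device() reports the accelerator configured for this
    # ExApp (e.g. "CUDA"); anything that is not a CUDA GPU falls back to CPU,
    # mirroring the check in create_model_loader().
    device = get_computation_device().lower()
    return device if device == "cuda" else "cpu"


# Hypothetical model path, used only for illustration.
model_loader = lambda: WhisperModel("/models/faster-whisper-small", device=pick_device())

# The WhisperModel is only instantiated when the loader is actually called.
model = model_loader()

Deferring WhisperModel construction behind a lambda keeps app startup cheap: the model weights are only loaded onto the selected device when a loader is first invoked.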
