Add model management: switch, download, delete models via admin panel and API

This commit is contained in:
Dominic Ballenthin
2026-01-29 01:45:10 +01:00
parent 0f336428a0
commit ee9465f661
6 changed files with 443 additions and 12 deletions

View File

@@ -6,7 +6,14 @@ import os
import hashlib import hashlib
from src.config import settings from src.config import settings
from src.services.whisper_service import transcribe_audio, get_model_status from src.services.whisper_service import (
transcribe_audio,
get_model_status,
get_available_models,
switch_model,
reload_model,
delete_model
)
from src.services.stats_service import log_usage from src.services.stats_service import log_usage
from src.database.db import get_db from src.database.db import get_db
from sqlalchemy.orm import Session from sqlalchemy.orm import Session
@@ -97,6 +104,55 @@ async def model_status_endpoint(api_key: str = Depends(verify_api_key)):
return get_model_status() return get_model_status()
@router.get("/available-models")
async def list_available_models(api_key: str = Depends(verify_api_key)):
"""List all available Whisper models with download status"""
return {
"models": get_available_models()
}
@router.post("/switch-model")
async def switch_model_endpoint(
model: str = Form(...),
api_key: str = Depends(verify_api_key)
):
"""Switch to a different Whisper model"""
try:
result = switch_model(model)
return result
except ValueError as e:
raise HTTPException(status_code=400, detail=str(e))
except Exception as e:
raise HTTPException(status_code=500, detail=str(e))
@router.post("/reload-model")
async def reload_model_endpoint(api_key: str = Depends(verify_api_key)):
"""Reload current model (re-download)"""
try:
# This will run in background to not block the API
result = reload_model()
return result
except Exception as e:
raise HTTPException(status_code=500, detail=str(e))
@router.delete("/delete-model/{model_name}")
async def delete_model_endpoint(
model_name: str,
api_key: str = Depends(verify_api_key)
):
"""Delete a downloaded model"""
try:
result = delete_model(model_name)
return result
except ValueError as e:
raise HTTPException(status_code=400, detail=str(e))
except Exception as e:
raise HTTPException(status_code=500, detail=str(e))
@router.post("/audio/transcriptions") @router.post("/audio/transcriptions")
async def create_transcription( async def create_transcription(
file: UploadFile = File(...), file: UploadFile = File(...),

View File

@@ -1,16 +1,18 @@
import whisper import whisper
import torch import torch
import os import os
from typing import Optional, Dict, Any from typing import Optional, Dict, Any, List
import asyncio import asyncio
from concurrent.futures import ThreadPoolExecutor from concurrent.futures import ThreadPoolExecutor
import threading import threading
import time import time
import shutil
from src.config import settings from src.config import settings
# Global model cache # Global model cache
_model = None _model = None
_current_model_name = settings.whisper_model
_executor = ThreadPoolExecutor(max_workers=1) _executor = ThreadPoolExecutor(max_workers=1)
_model_lock = threading.Lock() _model_lock = threading.Lock()
@@ -25,6 +27,18 @@ _model_status = {
"is_loaded": False "is_loaded": False
} }
# Available Whisper models with their sizes (approximate)
AVAILABLE_MODELS = {
"tiny": {"size": "39 MB", "description": "Fastest, lowest accuracy", "english_only": False},
"base": {"size": "74 MB", "description": "Fast, good for testing", "english_only": False},
"small": {"size": "244 MB", "description": "Balanced speed/accuracy", "english_only": False},
"medium": {"size": "769 MB", "description": "Good accuracy", "english_only": False},
"large-v1": {"size": "1.55 GB", "description": "High accuracy (legacy)", "english_only": False},
"large-v2": {"size": "2.87 GB", "description": "Higher accuracy", "english_only": False},
"large-v3": {"size": "2.88 GB", "description": "Best accuracy", "english_only": False},
"large": {"size": "2.88 GB", "description": "Alias for large-v3", "english_only": False},
}
def _download_hook(progress_bytes, total_bytes): def _download_hook(progress_bytes, total_bytes):
"""Hook to track download progress""" """Hook to track download progress"""
@@ -37,28 +51,39 @@ def _download_hook(progress_bytes, total_bytes):
_model_status["status_message"] = f"Downloading: {_model_status['download_percentage']}%" _model_status["status_message"] = f"Downloading: {_model_status['download_percentage']}%"
def load_model(): def load_model(model_name: str = None):
"""Load Whisper model""" """Load Whisper model"""
global _model, _model_status global _model, _model_status, _current_model_name
if model_name is None:
model_name = settings.whisper_model
with _model_lock: with _model_lock:
# If a different model is loaded, unload it first
if _model is not None and _current_model_name != model_name:
print(f"Switching from {_current_model_name} to {model_name}")
_model = None
torch.cuda.empty_cache() if torch.cuda.is_available() else None
if _model is None: if _model is None:
_model_status["is_downloading"] = True _model_status["is_downloading"] = True
_model_status["status_message"] = "Starting download..." _model_status["status_message"] = "Starting download..."
_model_status["model_name"] = model_name
print(f"Loading Whisper model: {settings.whisper_model}") print(f"Loading Whisper model: {model_name}")
try: try:
# Whisper doesn't have a direct progress callback, but we can monitor the models directory # Whisper doesn't have a direct progress callback, but we can monitor the models directory
_model = whisper.load_model( _model = whisper.load_model(
settings.whisper_model, model_name,
device=settings.whisper_device, device=settings.whisper_device,
download_root=settings.models_path download_root=settings.models_path
) )
_current_model_name = model_name
_model_status["is_downloading"] = False _model_status["is_downloading"] = False
_model_status["is_loaded"] = True _model_status["is_loaded"] = True
_model_status["download_percentage"] = 100 _model_status["download_percentage"] = 100
_model_status["status_message"] = "Model loaded successfully" _model_status["status_message"] = "Model loaded successfully"
print(f"Model loaded on {settings.whisper_device}") print(f"Model {model_name} loaded on {settings.whisper_device}")
except Exception as e: except Exception as e:
_model_status["is_downloading"] = False _model_status["is_downloading"] = False
_model_status["status_message"] = f"Error: {str(e)}" _model_status["status_message"] = f"Error: {str(e)}"
@@ -69,7 +94,7 @@ def load_model():
def get_model_info(): def get_model_info():
"""Get model information""" """Get model information"""
global _model_status global _model_status, _current_model_name
# Check if model files exist in the models directory # Check if model files exist in the models directory
model_files = [] model_files = []
@@ -87,15 +112,23 @@ def get_model_info():
except: except:
pass pass
# large-v3 is approximately 2.9GB # Get expected size for current model
expected_size = 2.9 * 1024 * 1024 * 1024 # 2.9 GB in bytes expected_size_gb = 2.9 # default to large-v3
if _current_model_name in AVAILABLE_MODELS:
size_str = AVAILABLE_MODELS[_current_model_name]["size"]
if "GB" in size_str:
expected_size_gb = float(size_str.replace(" GB", ""))
elif "MB" in size_str:
expected_size_gb = float(size_str.replace(" MB", "")) / 1024
expected_size = expected_size_gb * 1024 * 1024 * 1024
if total_size > 0: if total_size > 0:
estimated_percentage = min(99, round((total_size / expected_size) * 100, 2)) estimated_percentage = min(99, round((total_size / expected_size) * 100, 2))
_model_status["download_percentage"] = estimated_percentage _model_status["download_percentage"] = estimated_percentage
_model_status["status_message"] = f"Downloading: {estimated_percentage}%" _model_status["status_message"] = f"Downloading: {estimated_percentage}%"
return { return {
"name": settings.whisper_model, "name": _current_model_name,
"device": settings.whisper_device, "device": settings.whisper_device,
"loaded": _model is not None, "loaded": _model is not None,
"is_downloading": _model_status["is_downloading"], "is_downloading": _model_status["is_downloading"],
@@ -110,6 +143,94 @@ def get_model_status():
return get_model_info() return get_model_info()
def get_available_models():
    """Get list of available models with their download status"""
    models_dir = settings.models_path

    # Collect the names of every model whose weight file is already on disk
    # (whisper stores each model as "<name>.pt" under the download root).
    downloaded = set()
    if os.path.exists(models_dir):
        downloaded = {
            fname[:-3]  # strip the ".pt" suffix to recover the model name
            for fname in os.listdir(models_dir)
            if fname.endswith('.pt')
        }

    return [
        {
            "name": name,
            "size": info["size"],
            "description": info["description"],
            "english_only": info["english_only"],
            "is_downloaded": name in downloaded,
            "is_active": name == _current_model_name and _model is not None,
        }
        for name, info in AVAILABLE_MODELS.items()
    ]
def switch_model(model_name: str):
    """Activate a different Whisper model, loading (and if needed downloading) it.

    Raises:
        ValueError: If model_name is not in the known-model catalogue.
    """
    global _model, _current_model_name

    if model_name not in AVAILABLE_MODELS:
        raise ValueError(f"Unknown model: {model_name}")

    already_active = _model is not None and model_name == _current_model_name
    if already_active:
        return {"status": "already_active", "message": f"Model {model_name} is already active"}

    # load_model() takes care of unloading the previously active model.
    load_model(model_name)
    return {"status": "success", "message": f"Switched to model {model_name}"}
def delete_model(model_name: str):
    """Delete a downloaded model's weight file from the models directory.

    If the model being deleted is the one currently loaded, it is unloaded
    first (and its GPU memory released) before the file is removed.

    Args:
        model_name: Name of the model; must be a key of AVAILABLE_MODELS.

    Returns:
        dict with "status" ("success" / "not_found") and a human-readable
        "message".

    Raises:
        ValueError: If model_name is not a known model.
    """
    global _model, _current_model_name

    if model_name not in AVAILABLE_MODELS:
        raise ValueError(f"Unknown model: {model_name}")

    models_dir = settings.models_path
    model_file = os.path.join(models_dir, f"{model_name}.pt")

    if not os.path.exists(model_file):
        return {"status": "not_found", "message": f"Model {model_name} is not downloaded"}

    # Hold the model lock while unloading/deleting so we cannot race a
    # concurrent load_model() that is loading this same model. (The
    # original code mutated _model and _current_model_name with no lock.)
    with _model_lock:
        # If this model is currently loaded, unload it first
        if model_name == _current_model_name and _model is not None:
            _model = None
            # Plain statement instead of the side-effect-only conditional
            # expression used before.
            if torch.cuda.is_available():
                torch.cuda.empty_cache()
            _current_model_name = None

        # Delete the file
        os.remove(model_file)

    return {"status": "success", "message": f"Model {model_name} deleted"}
def reload_model():
    """Reload current model (useful for re-downloading).

    Unloads the current model and deletes its weight file while holding
    _model_lock, then calls load_model() AFTER releasing the lock:
    load_model() acquires the same non-reentrant threading.Lock internally,
    so calling it while still holding the lock (as the original code did)
    deadlocks the whole service.

    Returns:
        dict with "status" and a human-readable "message".
    """
    global _model

    with _model_lock:
        model_name = _current_model_name if _current_model_name else settings.whisper_model

        # Unload current model
        if _model is not None:
            _model = None
            if torch.cuda.is_available():
                torch.cuda.empty_cache()

        # Delete the weight file (if present) so load_model() re-downloads it
        model_file = os.path.join(settings.models_path, f"{model_name}.pt")
        if os.path.exists(model_file):
            os.remove(model_file)

    # Reload model (will trigger download). Must happen outside the lock —
    # load_model() takes _model_lock itself.
    load_model(model_name)

    return {"status": "success", "message": f"Model {model_name} reloaded"}
def _transcribe_sync( def _transcribe_sync(
audio_path: str, audio_path: str,
language: Optional[str] = None, language: Optional[str] = None,

View File

@@ -9,6 +9,7 @@
<div class="nav"> <div class="nav">
<a href="/admin" class="active">Dashboard</a> <a href="/admin" class="active">Dashboard</a>
<a href="/admin/keys">API Keys</a> <a href="/admin/keys">API Keys</a>
<a href="/admin/models">Models</a>
<a href="/admin/logout">Logout</a> <a href="/admin/logout">Logout</a>
</div> </div>
</div> </div>

View File

@@ -9,6 +9,7 @@
<div class="nav"> <div class="nav">
<a href="/admin">Dashboard</a> <a href="/admin">Dashboard</a>
<a href="/admin/keys" class="active">API Keys</a> <a href="/admin/keys" class="active">API Keys</a>
<a href="/admin/models">Models</a>
<a href="/admin/logout">Logout</a> <a href="/admin/logout">Logout</a>
</div> </div>
</div> </div>

124
src/templates/models.html Normal file
View File

@@ -0,0 +1,124 @@
{% extends "base.html" %}
{% block title %}Models - Whisper API Admin{% endblock %}
{% block content %}
<div class="container">
<div class="header">
<h1>🤖 Model Management</h1>
<div class="nav">
<a href="/admin">Dashboard</a>
<a href="/admin/keys">API Keys</a>
<a href="/admin/models" class="active">Models</a>
<a href="/admin/logout">Logout</a>
</div>
</div>
<!-- Current Model Status -->
<div class="card">
<h2>Current Model Status</h2>
<div id="current-model-info">
<p><strong>Active Model:</strong> {{ current_status.name }}</p>
<p><strong>Device:</strong> {{ current_status.device }}</p>
<p><strong>Status:</strong>
{% if current_status.loaded %}
<span style="color: #48bb78;">✅ Loaded & Ready</span>
{% elif current_status.is_downloading %}
<span style="color: #ed8936;">⏳ Downloading ({{ current_status.download_percentage }}%)</span>
{% else %}
<span style="color: #718096;">⏸️ Not Loaded</span>
{% endif %}
</p>
{% if current_status.is_downloading %}
<div style="background: #e2e8f0; border-radius: 10px; height: 20px; overflow: hidden; margin-top: 10px;">
<div id="download-progress" style="background: linear-gradient(90deg, #667eea, #764ba2); height: 100%; width: {{ current_status.download_percentage }}%; transition: width 0.5s ease;"></div>
</div>
{% endif %}
</div>
</div>
<!-- Available Models -->
<div class="card">
<h2>Available Models</h2>
<table>
<thead>
<tr>
<th>Model</th>
<th>Size</th>
<th>Description</th>
<th>Status</th>
<th>Actions</th>
</tr>
</thead>
<tbody>
{% for model in models %}
<tr>
<td><strong>{{ model.name }}</strong></td>
<td>{{ model.size }}</td>
<td>{{ model.description }}</td>
<td>
{% if model.is_active %}
<span class="badge badge-success">Active</span>
{% elif model.is_downloaded %}
<span class="badge" style="background: #bee3f8; color: #2c5282;">Downloaded</span>
{% else %}
<span class="badge badge-danger">Not Downloaded</span>
{% endif %}
</td>
<td>
{% if not model.is_active %}
<form method="POST" action="/admin/models/switch" style="display: inline;">
<input type="hidden" name="model_name" value="{{ model.name }}">
<button type="submit" class="btn" style="padding: 5px 10px; font-size: 12px;"
{% if not model.is_downloaded %}disabled{% endif %}>
Activate
</button>
</form>
{% endif %}
{% if model.is_downloaded %}
<form method="POST" action="/admin/models/delete" style="display: inline; margin-left: 5px;"
onsubmit="return confirm('Are you sure you want to delete this model?');">
<input type="hidden" name="model_name" value="{{ model.name }}">
<button type="submit" class="btn btn-danger" style="padding: 5px 10px; font-size: 12px;"
{% if model.is_active %}disabled{% endif %}>
Delete
</button>
</form>
{% else %}
<form method="POST" action="/admin/models/download" style="display: inline; margin-left: 5px;">
<input type="hidden" name="model_name" value="{{ model.name }}">
<button type="submit" class="btn btn-success" style="padding: 5px 10px; font-size: 12px;">
Download
</button>
</form>
{% endif %}
</td>
</tr>
{% endfor %}
</tbody>
</table>
</div>
<!-- Reload Current Model -->
<div class="card">
<h2>Reload Current Model</h2>
<p>If you experience issues with the current model, you can reload it. This will delete and re-download the model files.</p>
<form method="POST" action="/admin/models/reload" onsubmit="return confirm('This will delete and re-download the current model. Continue?');">
<button type="submit" class="btn" style="background: #ed8936;">
🔄 Reload Model
</button>
</form>
</div>
</div>
<script>
// Auto-refresh page every 5 seconds if downloading
{% if current_status.is_downloading %}
setTimeout(function() {
window.location.reload();
}, 5000);
{% endif %}
</script>
{% endblock %}

View File

@@ -11,7 +11,7 @@ from src.config import settings
from src.database.db import get_db from src.database.db import get_db
from src.database.models import ApiKey, UsageLog from src.database.models import ApiKey, UsageLog
from src.services.stats_service import get_usage_stats, hash_api_key from src.services.stats_service import get_usage_stats, hash_api_key
from src.services.whisper_service import get_model_status from src.services.whisper_service import get_model_status, get_available_models
router = APIRouter() router = APIRouter()
templates = Jinja2Templates(directory="src/templates") templates = Jinja2Templates(directory="src/templates")
@@ -188,3 +188,131 @@ async def delete_key(
db.commit() db.commit()
return RedirectResponse(url="/admin/keys", status_code=302) return RedirectResponse(url="/admin/keys", status_code=302)
@router.get("/models", response_class=HTMLResponse)
async def manage_models(request: Request, message: Optional[str] = None, error: Optional[str] = None):
"""Model management page"""
try:
check_admin_auth(request)
except HTTPException as e:
return RedirectResponse(url="/admin/login", status_code=302)
models = get_available_models()
current_status = get_model_status()
return templates.TemplateResponse("models.html", {
"request": request,
"models": models,
"current_status": current_status,
"message": message,
"error": error
})
@router.post("/models/switch")
async def switch_model_admin(
request: Request,
model_name: str = Form(...)
):
"""Switch to a different model"""
try:
check_admin_auth(request)
except HTTPException as e:
return RedirectResponse(url="/admin/login", status_code=302)
try:
from src.services.whisper_service import switch_model
result = switch_model(model_name)
return RedirectResponse(
url=f"/admin/models?message={result['message']}",
status_code=302
)
except Exception as e:
return RedirectResponse(
url=f"/admin/models?error={str(e)}",
status_code=302
)
@router.post("/models/delete")
async def delete_model_admin(
request: Request,
model_name: str = Form(...)
):
"""Delete a model"""
try:
check_admin_auth(request)
except HTTPException as e:
return RedirectResponse(url="/admin/login", status_code=302)
try:
from src.services.whisper_service import delete_model
result = delete_model(model_name)
return RedirectResponse(
url=f"/admin/models?message={result['message']}",
status_code=302
)
except Exception as e:
return RedirectResponse(
url=f"/admin/models?error={str(e)}",
status_code=302
)
@router.post("/models/download")
async def download_model_admin(
request: Request,
model_name: str = Form(...)
):
"""Download a model"""
try:
check_admin_auth(request)
except HTTPException as e:
return RedirectResponse(url="/admin/login", status_code=302)
try:
from src.services.whisper_service import load_model
# Start download in background (non-blocking for API)
import threading
def download():
try:
load_model(model_name)
except Exception as e:
print(f"Error downloading model {model_name}: {e}")
thread = threading.Thread(target=download)
thread.daemon = True
thread.start()
return RedirectResponse(
url=f"/admin/models?message=Started downloading model {model_name}",
status_code=302
)
except Exception as e:
return RedirectResponse(
url=f"/admin/models?error={str(e)}",
status_code=302
)
@router.post("/models/reload")
async def reload_model_admin(request: Request):
"""Reload current model"""
try:
check_admin_auth(request)
except HTTPException as e:
return RedirectResponse(url="/admin/login", status_code=302)
try:
from src.services.whisper_service import reload_model
result = reload_model()
return RedirectResponse(
url=f"/admin/models?message={result['message']}",
status_code=302
)
except Exception as e:
return RedirectResponse(
url=f"/admin/models?error={str(e)}",
status_code=302
)