alihan was specified
@@ -1,7 +1,7 @@
#!/usr/bin/env python3
"""
Model Management Module
Responsible for loading, caching, and managing Whisper models
"""

import os
@@ -11,86 +11,86 @@ from typing import Dict, Any
import torch
from faster_whisper import WhisperModel, BatchedInferencePipeline


# Log configuration
logger = logging.getLogger(__name__)

# Global model instance cache
model_instances = {}
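# Note: no eviction logic is defined here; once created, an entry stays
# resident for the lifetime of the process.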


def get_whisper_model(model_name: str, device: str, compute_type: str) -> Dict[str, Any]:
    """
    Get or create Whisper model instance

    Args:
        model_name: Model name (tiny, base, small, medium, large-v1, large-v2, large-v3)
        device: Running device (cpu, cuda, auto)
        compute_type: Computation type (float16, int8, auto)

    Returns:
        dict: Dictionary containing model instance and configuration
    """
    global model_instances

    # Validate model name
    valid_models = ["tiny", "base", "small", "medium", "large-v1", "large-v2", "large-v3"]
    if model_name not in valid_models:
        raise ValueError(f"Invalid model name: {model_name}. Valid models: {', '.join(valid_models)}")

    # Auto-detect device
    if device == "auto":
        device = "cuda" if torch.cuda.is_available() else "cpu"
        compute_type = "float16" if device == "cuda" else "int8"
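        # Rationale for the defaults: float16 keeps GPU throughput at half the
        # memory of float32, while int8 is typically the fastest CTranslate2
        # path on CPU.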

    # Validate device and compute type
    if device not in ["cpu", "cuda"]:
        raise ValueError(f"Invalid device: {device}. Valid devices: cpu, cuda")

    if device == "cuda" and not torch.cuda.is_available():
        logger.warning("CUDA not available, automatically switching to CPU")
        device = "cpu"
        compute_type = "int8"

    # Resolve an "auto" compute type for an explicitly chosen device, as the
    # docstring promises; otherwise "auto" would fail the validation below
    if compute_type == "auto":
        compute_type = "float16" if device == "cuda" else "int8"

    if compute_type not in ["float16", "int8"]:
        raise ValueError(f"Invalid compute type: {compute_type}. Valid compute types: float16, int8")

    if device == "cpu" and compute_type == "float16":
        logger.warning("CPU device does not support float16 computation type, automatically switching to int8")
        compute_type = "int8"

    # Generate model key
    model_key = f"{model_name}_{device}_{compute_type}"
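    # e.g. "base_cuda_float16"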

    # If model is already instantiated, return directly
    if model_key in model_instances:
        logger.info(f"Using cached model instance: {model_key}")
        return model_instances[model_key]

    # Clean GPU memory (if using CUDA)
    if device == "cuda":
        torch.cuda.empty_cache()

    # Instantiate model
    try:
        logger.info(f"Loading Whisper model: {model_name} device: {device} compute type: {compute_type}")

        # Base model
        model = WhisperModel(
            model_name,
            device=device,
            compute_type=compute_type,
            download_root=os.environ.get("WHISPER_MODEL_DIR", None)  # Support custom model directory
        )

        # Batch processing settings - batch processing enabled by default to improve speed
        batched_model = None
        batch_size = 0

        if device == "cuda":  # Only use batch processing on CUDA devices
            # Determine appropriate batch size based on available memory
            if torch.cuda.is_available():
                gpu_mem = torch.cuda.get_device_properties(0).total_memory
                free_mem = gpu_mem - torch.cuda.memory_allocated()
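                # Note: torch.cuda.memory_allocated() counts only this
                # process's tensor allocations, so free_mem can overstate the
                # truly free memory when the GPU is shared with other processes.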
                # Dynamically adjust batch size based on GPU memory
                if free_mem > 16e9:  # >16GB
                    batch_size = 32
                elif free_mem > 12e9:  # >12GB
@@ -99,17 +99,17 @@ def get_whisper_model(model_name: str, device: str, compute_type: str) -> Dict[s
                    batch_size = 8
                elif free_mem > 4e9:  # >4GB
                    batch_size = 4
                else:  # Smaller memory
                    batch_size = 2

                logger.info(f"Available GPU memory: {free_mem / 1e9:.2f} GB")
            else:
                batch_size = 8  # Default value

            logger.info(f"Enabling batch processing acceleration, batch size: {batch_size}")
            batched_model = BatchedInferencePipeline(model=model)
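            # BatchedInferencePipeline batches segments at transcription time;
            # the size is passed per call, e.g.
            # batched_model.transcribe(audio, batch_size=batch_size).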

        # Create result object
        result = {
            'model': model,
            'device': device,
@@ -119,20 +119,20 @@ def get_whisper_model(model_name: str, device: str, compute_type: str) -> Dict[s
            'load_time': time.time()
        }

        # Cache instance
        model_instances[model_key] = result
        return result

    except Exception as e:
        logger.error(f"Failed to load model: {str(e)}")
        raise
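
# Example usage (a minimal sketch; "audio.mp3" is a placeholder path):
#   bundle = get_whisper_model("base", "auto", "auto")
#   segments, info = bundle['model'].transcribe("audio.mp3")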


def get_model_info() -> str:
    """
    Get available Whisper model information

    Returns:
        str: JSON string of model information
    """
    import json

@@ -142,15 +142,15 @@ def get_model_info() -> str:
    devices = ["cpu", "cuda"] if torch.cuda.is_available() else ["cpu"]
    compute_types = ["float16", "int8"] if torch.cuda.is_available() else ["int8"]

    # Supported language list
    languages = {
        "zh": "Chinese", "en": "English", "ja": "Japanese", "ko": "Korean", "de": "German",
        "fr": "French", "es": "Spanish", "ru": "Russian", "it": "Italian",
        "pt": "Portuguese", "nl": "Dutch", "ar": "Arabic", "hi": "Hindi",
        "tr": "Turkish", "vi": "Vietnamese", "th": "Thai", "id": "Indonesian"
    }

    # Supported audio formats
    audio_formats = [".mp3", ".wav", ".m4a", ".flac", ".ogg", ".aac"]

    info = {