# differ/app.py at master · sh1man/differ · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
"""
FastAPI приложение для оценки качества ASR.
"""
from fastapi import FastAPI, HTTPException
from pydantic import BaseModel, Field
import jiwer
from config import create_config
from utils import preprocess_text

# ASGI application object; title/description/version are the metadata handed
# to FastAPI for the generated API documentation.
app = FastAPI(
    version="0.1.0",
    title="ASR Differ API",
    description="API для сравнения эталонного текста с результатом ASR и расчета метрик WER/CER",
)

# Service configuration, built once at import time and shared by the handlers.
config = create_config()


class CompareRequest(BaseModel):
    """Request body for a comparison: a reference text plus an ASR hypothesis."""

    # Ground-truth transcript (required).
    reference_text: str = Field(
        ...,
        description="Эталонный (идеальный) текст",
    )
    # Transcript produced by the ASR system under evaluation (required).
    hypothesis_text: str = Field(
        ...,
        description="Текст, распознанный ASR системой",
    )

    # Example payload attached to the generated JSON schema.
    model_config = {
        "json_schema_extra": {
            "examples": [
                {
                    "reference_text": "всем добрый день у нас 2024 год",
                    "hypothesis_text": "Всем добрый день. У нас две тысячи двадцать четвёртый год.",
                },
            ],
        },
    }


class CompareResponse(BaseModel):
    """Response body of a comparison: error rates, edit counts and the normalized texts."""

    # Error rates.
    wer: float = Field(
        ...,
        description="Word Error Rate (процент ошибок на уровне слов)",
    )
    cer: float = Field(
        ...,
        description="Character Error Rate (процент ошибок на уровне символов)",
    )

    # Word-level edit counts; total_errors is the sum of the three below it.
    total_errors: int = Field(
        ...,
        description="Общее количество ошибок (S+D+I)",
    )
    substitutions: int = Field(
        ...,
        description="Количество замен (S)",
    )
    deletions: int = Field(
        ...,
        description="Количество удалений (D)",
    )
    insertions: int = Field(
        ...,
        description="Количество вставок (I)",
    )

    # Number of words in the reference text.
    total_words: int = Field(
        ...,
        description="Общее количество слов в эталонном тексте",
    )

    # Texts as they were actually scored, i.e. after preprocessing.
    reference_normalized: str = Field(
        ...,
        description="Нормализованный эталонный текст",
    )
    hypothesis_normalized: str = Field(
        ...,
        description="Нормализованный ASR текст",
    )

    # Example payload attached to the generated JSON schema.
    model_config = {
        "json_schema_extra": {
            "examples": [
                {
                    "wer": 0.0345,
                    "cer": 0.0123,
                    "total_errors": 12,
                    "substitutions": 8,
                    "deletions": 2,
                    "insertions": 2,
                    "total_words": 347,
                    "reference_normalized": "всем добрый день у нас две тысячи двадцать четыре год",
                    "hypothesis_normalized": "всем добрый день у нас две тысячи двадцать четыре год",
                },
            ],
        },
    }


@app.get("/")
async def root():
    """Return basic API metadata together with a map of the available endpoints."""
    # Path -> short human-readable description of each route.
    endpoint_map = {
        "/compare": "POST - Сравнить эталонный и ASR тексты",
        "/health": "GET - Проверка работоспособности",
        "/docs": "GET - Swagger документация",
    }
    api_info = {
        "name": "ASR Differ API",
        "version": "0.1.0",
        "description": "API для оценки качества ASR систем",
        "endpoints": endpoint_map,
    }
    return api_info


@app.get("/health")
async def health_check():
    """Report that the service is up and whether the config holds a Gemini API key."""
    # Only the presence of the key is exposed, never its value.
    has_gemini_key = bool(config.gemini_api_key)
    return {"status": "ok", "gemini_configured": has_gemini_key}


@app.post("/compare", response_model=CompareResponse)
async def compare_texts(request: CompareRequest):
    """
    Compare a reference text with the text produced by an ASR system.

    Both texts are run through ``preprocess_text`` and the results are scored
    with jiwer:
    - WER (Word Error Rate) - error rate at the word level
    - CER (Character Error Rate) - error rate at the character level
    - counts of substitutions, deletions and insertions

    The original description states that preprocessing normalizes numbers via
    Gemini AI; that helper lives in ``utils`` and is not visible from here.

    Args:
        request: Request carrying the reference and the ASR texts.

    Returns:
        CompareResponse: The metrics plus both preprocessed texts.

    Raises:
        HTTPException: 400 when the reference text is empty after
            preprocessing (the error rates are undefined without reference
            words); 500 for any other failure during processing.
    """
    try:
        # NOTE(review): preprocess_text is called synchronously inside an async
        # handler. If it performs network I/O (e.g. the Gemini call mentioned
        # above) it blocks the event loop - confirm, and consider running it
        # in a thread pool.
        reference_norm = preprocess_text(request.reference_text, config)
        hypothesis_norm = preprocess_text(request.hypothesis_text, config)

        # jiwer rejects an empty reference with a ValueError, which would
        # otherwise surface as a misleading 500. This is a client-side input
        # problem, so report it as such.
        if not reference_norm.strip():
            raise HTTPException(
                status_code=400,
                detail="Эталонный текст пуст после нормализации"
            )

        # Word-level metrics.
        word_output = jiwer.process_words(reference_norm, hypothesis_norm)

        wer = word_output.wer
        substitutions = word_output.substitutions
        deletions = word_output.deletions
        insertions = word_output.insertions
        total_errors = substitutions + deletions + insertions
        total_words = len(reference_norm.split())

        # Character-level metrics.
        char_output = jiwer.process_characters(reference_norm, hypothesis_norm)
        cer = char_output.cer

        return CompareResponse(
            wer=wer,
            cer=cer,
            total_errors=total_errors,
            substitutions=substitutions,
            deletions=deletions,
            insertions=insertions,
            total_words=total_words,
            reference_normalized=reference_norm,
            hypothesis_normalized=hypothesis_norm
        )

    except HTTPException:
        # Deliberate HTTP errors raised above must keep their status code
        # instead of being rewrapped as a 500 by the generic handler below.
        raise
    except Exception as e:
        # Chain the cause so the original traceback is kept for debugging.
        raise HTTPException(
            status_code=500,
            detail=f"Ошибка при обработке текстов: {str(e)}"
        ) from e


if __name__ == "__main__":
    # Executed as a script: serve `app` with uvicorn on all interfaces, port 8000.
    import uvicorn

    uvicorn.run(
        app,
        host="0.0.0.0",
        port=8000,
    )