-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmain.py
More file actions
136 lines (110 loc) · 4.17 KB
/
main.py
File metadata and controls
136 lines (110 loc) · 4.17 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
"""Language Detection API"""
import logging
import time
from os import environ
from typing import Annotated
from dotenv import load_dotenv
from litestar import Litestar, get, post
from litestar.config.cors import CORSConfig
from litestar.datastructures import State
from litestar.openapi import OpenAPIConfig
from litestar.params import Parameter
from litestar.response import Redirect
from litestar.status_codes import HTTP_200_OK
from app.http_exceptions import EmptyTextException
from app.language_utils import get_all_supported_languages
from app.schemas import DetectRequest, DetectResponse, LanguageInfo
from detectors.lingua_detector import LinguaDetector
from detectors.mediapipe_detector import MediaPipeDetector
# Configure root logging once at import time: INFO level, timestamped records.
logging.basicConfig(
    format="%(asctime)s - %(levelname)s - %(message)s",
    level=logging.INFO,
)
logger = logging.getLogger(__name__)

# Pull settings from a .env file (if any) into the process environment.
load_dotenv()

# Detector singletons; they stay None until the matching get_*_detector()
# accessor is called for the first time.
_mediapipe_detector = None
_lingua_detector = None
def get_mediapipe_detector() -> MediaPipeDetector:
    """Return the shared MediaPipe detector, creating it on first use.

    The model file location is read from the ``MEDIAPIPE_MODEL_PATH``
    environment variable and falls back to
    ``/app/models/language_detector.tflite`` when the variable is unset.

    Returns:
        The module-wide ``MediaPipeDetector`` instance. Calls after the first
        one reuse the instance stored in ``_mediapipe_detector``.
    """
    global _mediapipe_detector
    if _mediapipe_detector is None:
        model_path = environ.get(
            "MEDIAPIPE_MODEL_PATH", "/app/models/language_detector.tflite"
        )
        # Report through the module logger instead of print() so start-up
        # messages use the format and level set by logging.basicConfig.
        logger.info("Initializing MediaPipe detector with model: %s", model_path)
        _mediapipe_detector = MediaPipeDetector(model_path)
        logger.info("✓ MediaPipe detector initialized")
    return _mediapipe_detector
def get_lingua_detector() -> LinguaDetector:
    """Return the shared Lingua detector, creating it on first use.

    Returns:
        The module-wide ``LinguaDetector`` instance. Calls after the first
        one reuse the instance stored in ``_lingua_detector``.
    """
    global _lingua_detector
    if _lingua_detector is None:
        # Report through the module logger instead of print() so start-up
        # messages use the format and level set by logging.basicConfig.
        logger.info("Initializing Lingua detector...")
        _lingua_detector = LinguaDetector()
        logger.info("✓ Lingua detector initialized")
    return _lingua_detector
@get("/health", summary="Health check endpoint", include_in_schema=False)
async def health() -> dict:
    """Report that the service is up by returning a fixed status payload."""
    payload = {"status": "ok"}
    return payload
@post(
    "/detect",
    summary="Detect language of text",
    description="Detect the language of provided text using MediaPipe (default) or Lingua detector",
    status_code=HTTP_200_OK,
)
async def detect(data: DetectRequest) -> DetectResponse:
    """Detect the language of ``data.text`` with the requested detector.

    Args:
        data: Request payload. ``text`` is the input to classify and
            ``method`` selects the detector (``"mediapipe"`` or ``"lingua"``).

    Returns:
        A ``DetectResponse`` carrying the detected language, the detector's
        confidence and the name of the method that produced the result.

    Raises:
        EmptyTextException: If ``text`` is empty or whitespace-only, or if
            ``method`` is neither ``"mediapipe"`` nor ``"lingua"``.
    """
    # perf_counter() is monotonic, so the measured duration cannot be skewed
    # by wall-clock adjustments the way time.time() differences can.
    started = time.perf_counter()

    if not data.text or not data.text.strip():
        raise EmptyTextException()

    # Truncate text for logging (max 50 chars)
    text_preview = data.text[:50] + "..." if len(data.text) > 50 else data.text

    # Pick the detector first; the detection and response construction are
    # identical for both methods, so they are shared below.
    if data.method == "mediapipe":
        detector, method = get_mediapipe_detector(), "mediapipe"
    elif data.method == "lingua":
        detector, method = get_lingua_detector(), "lingua"
    else:
        # NOTE(review): an unrecognised method is reported with the same
        # exception as blank text -- confirm whether a dedicated error type
        # is intended here.
        raise EmptyTextException()

    # NOTE(review): detect() is called synchronously inside this async
    # handler -- confirm that detection is fast enough not to stall other
    # requests.
    result = detector.detect(data.text)
    response = DetectResponse(
        language=result.language, confidence=result.confidence, method=method
    )

    # Elapsed time in milliseconds
    execution_time = (time.perf_counter() - started) * 1000

    # Log request info
    confidence_str = f"{response.confidence:.2f}" if response.confidence is not None else "None"
    logger.info(
        f"[{execution_time:.0f}ms] input=\"{text_preview}\" -> {response.language}-{confidence_str},method={response.method}"
    )
    return response
@get(["/", "/docs"], include_in_schema=False)
async def docs() -> Redirect:
    """Send requests for ``/`` and ``/docs`` on to the ``/schema`` path."""
    target = "/schema"
    return Redirect(target)
@get(
    "/detect/languages",
    summary="Get supported languages",
    description="Get list of all supported languages with their detection methods",
    status_code=HTTP_200_OK,
)
async def get_languages() -> list[LanguageInfo]:
    """Return one ``LanguageInfo`` per entry from ``get_all_supported_languages()``."""
    languages: list[LanguageInfo] = []
    for entry in get_all_supported_languages():
        # Each entry is unpacked as keyword arguments for LanguageInfo.
        languages.append(LanguageInfo(**entry))
    return languages
# Application object: registers the four route handlers defined above and
# attaches the OpenAPI and CORS configuration.
app = Litestar(
    route_handlers=[health, detect, docs, get_languages],
    openapi_config=OpenAPIConfig(
        description="Detect language of text using MediaPipe or Lingua",
        root_schema_site="swagger",
        title="Language Detection API",
        version="1.0.0",
    ),
    cors_config=CORSConfig(),
)