Spaces:
Sleeping
Sleeping
| from transformers import pipeline | |
| from src.utils.config import DALAT5_MODEL | |
| from typing import List | |
class DalaTransliterator:
    """
    Simple wrapper for the DalaT5 transliterator model.

    A ``text2text-generation`` pipeline is created once in the constructor
    and reused by every transliteration call on the instance.
    """

    def __init__(self, model_name: str = DALAT5_MODEL):
        """
        Build the underlying pipeline.

        Args:
            model_name: Model identifier handed to ``pipeline(...)`` as its
                ``model`` argument. Defaults to the project-configured
                ``DALAT5_MODEL``.
        """
        self.pipe = pipeline("text2text-generation", model=model_name)

    def transliterate(self, text: str, max_length: int = 128) -> str:
        """
        Transliterate a given text using DalaT5.

        The input is stripped of surrounding whitespace and prefixed with
        the ``Cyrillic2Latin: `` task tag before being sent to the pipeline.

        Args:
            text: Text to transliterate.
            max_length: Forwarded unchanged to the pipeline call as
                ``max_length`` (presumably the cap on generated length --
                confirm against the pipeline documentation).

        Returns:
            The ``generated_text`` of the first pipeline result, or an empty
            string when ``text`` is empty or contains only whitespace.
        """
        cleaned = text.strip()
        if not cleaned:
            # Nothing to transliterate: prompting the model with a bare task
            # prefix would only waste a generation pass and return arbitrary
            # model output instead of an empty result.
            return ""

        input_text = f"Cyrillic2Latin: {cleaned}"
        result = self.pipe(input_text, max_length=max_length)
        return result[0]["generated_text"]

    def batch_transliterate(self, texts: List[str], max_length: int = 128) -> List[str]:
        """
        Perform batch transliteration using DalaT5.

        Each item is passed through :meth:`transliterate` in turn, so the
        output order matches the input order and an empty input list yields
        an empty list.

        Args:
            texts: Texts to transliterate.
            max_length: Passed through to :meth:`transliterate` for every
                item.

        Returns:
            One transliterated string per input text.
        """
        return [self.transliterate(t, max_length) for t in texts]