tilmash-gemma3-translator / utils /text_processing.py
asasasaasasa's picture
Upload folder using huggingface_hub
3c3ac9d verified
raw
history blame contribute delete
374 Bytes
# utils/text_processing.py
from langdetect import detect, DetectorFactory
# Pin langdetect's random seed so repeated detection on the same text yields
# the same answer (the library's README describes detection as
# non-deterministic unless a seed is set before the first call).
DetectorFactory.seed = 0
def detect_language(text):
    """Detect the language of *text*, restricted to Russian, English and Kazakh.

    Args:
        text: The string whose language should be identified.

    Returns:
        ``'ru'``, ``'en'`` or ``'kk'`` when the detector reports one of those
        codes; ``None`` when any other code is reported, when *text* is
        empty, whitespace-only or not a string, or when detection fails.
    """
    # Nothing to classify: answer directly instead of relying on the detector
    # raising for unusable input.
    if not isinstance(text, str) or not text.strip():
        return None

    try:
        lang = detect(text)
    except Exception:
        # Best-effort contract: any detection failure maps to None. Unlike a
        # bare ``except:``, this lets KeyboardInterrupt/SystemExit propagate.
        return None

    # NOTE(review): this assumes langdetect reports Kazakh as 'kk'. Its
    # bundled language profiles may not include Kazakh at all, in which case
    # 'kk' is never returned -- confirm against the installed version.
    return lang if lang in ('ru', 'en', 'kk') else None