File size: 648 Bytes
ca2b720
1d40b2d
ca2b720
1d40b2d
 
 
ca2b720
1d40b2d
 
 
 
ca2b720
1d40b2d
 
ca2b720
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
import gradio as gr
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM

model_name = "tencent/Hunyuan-MT-7B"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSeq2SeqLM.from_pretrained(model_name, device_map="auto")

def translate(text, src="vi", tgt="km"):
    inputs = tokenizer(text, return_tensors="pt").to(model.device)
    outputs = model.generate(**inputs, forced_bos_token_id=tokenizer.lang_code_to_id[tgt])
    return tokenizer.decode(outputs[0], skip_special_tokens=True)

demo = gr.Interface(fn=translate, inputs="text", outputs="text",
    title="Hunyuan-MT-7B Dịch Việt ↔ Khmer")
demo.launch()