File size: 815 Bytes
591b3b9
 
 
 
 
 
 
 
7f6b908
 
591b3b9
 
 
 
 
7f6b908
 
 
 
 
 
 
 
 
591b3b9
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
import gradio as gr
from transformers import AutoModelForSeq2SeqLM, NllbTokenizerFast

model_repo = "wtarit/nllb-600M-th-en"

model = AutoModelForSeq2SeqLM.from_pretrained(model_repo)
tokenizer = NllbTokenizerFast.from_pretrained(model_repo, src_lang="tha_Thai", tgt_lang="eng_Latn")

def translate(Text):
    inputs = tokenizer(Text, return_tensors="pt")
    translated_tokens = model.generate(
        **inputs, forced_bos_token_id=tokenizer.lang_code_to_id["eng_Latn"], max_length=64
    )
    return tokenizer.batch_decode(translated_tokens, skip_special_tokens=True)[0]

demo = gr.Interface(
    fn=translate, 
    inputs=[
        gr.components.Textbox(placeholder="Enter Thai text here...")
    ], 
    outputs=["text"],
    title="NLLB TH-EN Translation",
    allow_flagging="never",
    )

demo.launch()