Spaces:

CodeTed
/

chinese_spelling_error_correction

Running

File size: 1,181 Bytes

e7ebace
abbaadb
 
 
 
 
0fecaab
5cda2b6
3970b0a
abbaadb
 
e7ebace
0cbca3d
3970b0a
 
736df11
 
 
3970b0a
 
0cbca3d
aee24dc
0cbca3d
aee24dc
0cbca3d
 
 
64fe5a1
0cbca3d

import gradio as gr
from transformers import AutoTokenizer, T5ForConditionalGeneration
tokenizer = AutoTokenizer.from_pretrained("CodeTed/traditional_CSC_t5")
model = T5ForConditionalGeneration.from_pretrained("CodeTed/traditional_CSC_t5")


def cged_correction(sentence = '為了降低少子化，政府可以堆動獎勵生育的政策。'):
    input_ids = tokenizer('糾正句子裡的錯字：' + sentence, return_tensors="pt").input_ids
    outputs = model.generate(input_ids, max_length=200)
    edited_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
    return edited_text

with gr.Blocks() as demo:
    gr.Markdown(
        """
    # 中文錯別字校正 - Chinese Spelling Correction
    ### Find Spelling Error and do the correction！
    Start typing below to see the correction.
    """
    )
    #設定輸入元件
    sent = gr.Textbox(label="Sentence", placeholder="input the sentence")
    # 設定輸出元件
    output = gr.Textbox(label="Result", placeholder="correction")
    #設定按鈕
    greet_btn = gr.Button("Correction")
    #設定按鈕點選事件
    greet_btn.click(fn=cged_correction, inputs=sent, outputs=output)
demo.launch()