# Scraped from a Hugging Face Space file view (page chrome, not program code):
#   uploader: svanhvit | commit e35b927 ("add app file") | size 1.09 kB
import gradio as gr
from transformers import pipeline
import tokenizer
# Heading and blurb passed to the Gradio interface (user-facing, Icelandic).
title = "Textaleiðrétting fyrir íslensku"
description = "Hér má prófa tauganetslíkan sem leiðréttir margs konar málfars- og stafsetningarvillur í íslenskum texta."

# Correction model, created once when the module is executed. It is driven
# through the "translation" pipeline task, so results come back under the
# "translation_text" key.
# NOTE(review): max_length=512 presumably caps the generated output length
# per call -- confirm against the transformers pipeline docs.
translator = pipeline(
    "translation",
    model="mideind/yfirlestur-icelandic-correction-byt5",
    max_length=512,
)
def split_text(text):
    """Split ``text`` into sentences and return them as a list.

    Delegates to ``tokenizer.split_into_sentences`` with ``original=True``
    and collects everything it yields, in order.
    """
    # NOTE(review): ``original=True`` presumably yields each sentence with its
    # original spacing rather than normalised tokens -- confirm in the
    # Tokenizer package documentation.
    sentences = tokenizer.split_into_sentences(text, original=True)
    return list(sentences)
def predict(text):
    """Correct ``text`` sentence by sentence and return the corrected text.

    Newlines in the input are replaced by spaces, the result is split into
    sentences with ``split_text``, and every non-empty sentence is run
    through the module-level ``translator`` pipeline. The corrected
    sentences are joined with single spaces, so the original whitespace
    layout of the input is not preserved.

    Args:
        text: Raw input string from the user interface.

    Returns:
        The corrected sentences separated by single spaces, with no trailing
        space. An empty string is returned when there are no sentences.
    """
    flattened = text.replace("\n", " ")

    corrected = []
    for sentence in split_text(flattened):
        stripped = sentence.strip()
        if not stripped:
            # Nothing to correct; do not send an empty string to the model.
            continue
        corrected.append(translator(stripped)[0]["translation_text"])

    # Joining (rather than appending "<sentence> " each time) puts the space
    # only between sentences and avoids a dangling space at the end.
    return " ".join(corrected)
# Gradio front end: a single text input and a single text output, both
# wired to predict().
iface = gr.Interface(
    fn=predict,
    inputs="text",
    outputs="text",
    title=title,
    description=description,
    # Sample inputs offered in the UI; one inner list per example.
    examples=[
        ["Kvitu fiðrildinn fljua firir utan gluggan."],
        ["Ég held þetta er ekki góður tími fara heimsókn."],
        ["Kver a þenan bússtað ja eða nei"],
    ],
)

# Start the app as soon as this module is executed.
iface.launch()