File size: 2,228 Bytes
dc149ba
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
158e38e
dc149ba
 
 
 
 
 
3708fd3
dc149ba
 
 
 
 
 
 
 
 
 
 
 
592978b
dc149ba
 
2866119
dc149ba
 
 
 
 
 
2866119
dc149ba
 
2866119
dc149ba
f08dd12
592978b
f010b24
 
 
 
2866119
dc149ba
592978b
 
 
 
 
 
 
717e94d
dc149ba
 
cc4bac3
a7e8544
2866119
55f0629
 
 
3708fd3
 
55f0629
 
b44d3df
aad89b6
55f0629
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
"""
translation program for simple text
1. detect language from langdetect
2. translate to target language given by user

Example from
https://www.thepythoncode.com/article/machine-translation-using-huggingface-transformers-in-python 

user_input:
    string: string to be translated
    target_lang: language to be translated to

Returns:
    string: translated string of text
"""

import gradio as gr
import argparse

import langid
from transformers import pipeline


def detect_lang(article, target_lang):
    """
    Language Detection using library langid

    Args:
        article (string): article that user wish to translate
        target_lang (string): language user want to translate article into

    Returns:
        string: detected language short form
    """

    result_lang = langid.classify(article)
    return result_lang[0]


def opus_trans(article, target_language):
    """
    Translation by Helsinki-NLP model

    Args:
        article (string): article that user wishes to translate
        result_lang (string): detected language in short form
        target_language (string): language that user wishes to translate article into

    Returns:
        string: translated piece of article based off target_language
    """
    result_lang = detect_lang(article, target_language)

    if target_language == "English":
        target_lang = "en"
    elif target_language == "Chinese":
        target_lang = "zh"
    # result_lang = detect_lang(article, target_language)

    if result_lang != target_lang:
        task_name = f"translation_{result_lang}_to_{target_lang}"
        model_name = f"Helsinki-NLP/opus-mt-{result_lang}-{target_lang}"
        translator = pipeline(task_name, model=model_name, tokenizer=model_name)
        translated = translator(article)[0]["translation_text"]
        # print(translated)
    else:
        translated = "Error: You chose the same language as the article detected language. Please reselect target_language and try again."
    return translated


article = gr.Textbox()
lang_select = gr.Radio(["English", "Chinese"])
translate = gr.Interface(
    opus_trans,
    [
        article,
        lang_select,
    ],
    outputs=gr.Textbox(),
)

translate.launch()