Spaces:

Mamadou2727
/

Feriji_Translator

Sleeping

App Files Community

Mamadou2727 committed on Dec 6, 2023

Commit

d3ee320

1 Parent(s): 1dc68ce

Update

Browse files

Files changed (1) hide show

app.py +35 -23

app.py CHANGED Viewed

@@ -1,10 +1,7 @@
 import gradio as gr
-from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
 import torch
-import base64
-import io
-# Load the model and tokenizer
 model = AutoModelForSeq2SeqLM.from_pretrained("Mamadou2727/Feriji_model")
 tokenizer = AutoTokenizer.from_pretrained("facebook/m2m100_418M")
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
@@ -15,8 +12,9 @@ LANG_CODES = {
 def translate(text, candidates: int):
     """
-    Translate the text from French to Zarma.
     """
     src = LANG_CODES["French"]
     tgt = LANG_CODES["Zarma"]
@@ -29,7 +27,7 @@ def translate(text, candidates: int):
         'return_dict_in_generate': True,
         'output_scores': True,
         'output_hidden_states': True,
-        'length_penalty': 0.0,
         'num_return_sequences': candidates,
         'num_beams': candidates,
         'forced_bos_token_id': tokenizer.lang_code_to_id[tgt]
@@ -40,29 +38,43 @@ def translate(text, candidates: int):
     return '\n'.join(output)
-def translate_file(uploaded_file, candidates: int):
-    if uploaded_file is None:
-        return "No file uploaded."
-    # Decode the file content
-    file_content = base64.b64decode(uploaded_file['data'].split(',')[1])
-    text = io.BytesIO(file_content).read().decode("utf-8").strip()
-    return translate(text, candidates)
 with gr.Blocks() as app:
     with gr.Row():
-        gr.Markdown("Your markdown content here")
         with gr.Column():
             input_text = gr.components.Textbox(lines=7, label="Input Text", value="")
             return_seqs = gr.Slider(label="Number of return sequences", value=1, minimum=1, maximum=12, step=1)
             outputs = gr.Textbox(lines=7, label="Output Text")
-            translate_btn = gr.Button("Translate Text")
-            translate_btn.click(translate, inputs=[input_text, return_seqs], outputs=outputs)
-            upload_file = gr.File(label="Upload File")
-            translate_file_btn = gr.Button("Translate Uploaded File")
-            translate_file_btn.click(translate_file, inputs=[upload_file, return_seqs], outputs=outputs)
 app.launch(share=True)

 import gradio as gr
+from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
 import torch
 model = AutoModelForSeq2SeqLM.from_pretrained("Mamadou2727/Feriji_model")
 tokenizer = AutoTokenizer.from_pretrained("facebook/m2m100_418M")
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 def translate(text, candidates: int):
     """
+    Translate the text from French to Zarma
     """
     src = LANG_CODES["French"]
     tgt = LANG_CODES["Zarma"]
         'return_dict_in_generate': True,
         'output_scores': True,
         'output_hidden_states': True,
+        'length_penalty': 0.0,  # don't encourage longer or shorter output,
         'num_return_sequences': candidates,
         'num_beams': candidates,
         'forced_bos_token_id': tokenizer.lang_code_to_id[tgt]
     return '\n'.join(output)
 with gr.Blocks() as app:
+    markdown = r"""
+        # Feriji-fr-to-dje v.1.1, Proudly made by Elysabhete, Habibatou & Mamadou K.
+        <img src="https://cdn-uploads.huggingface.co/production/uploads/63cc1d4bf488db9bb3c6449e/AtOKLAaL5kt0VhRsxE0vf.png" width="500" height="300">
+        Feriji-fr-to-dje is a beta version of the French to Zarma translator.
+        ## Intended Uses & Limitations
+        This model is intended for academic research and practical applications in machine translation. It can be used to translate French text to Zarma and vice versa. Users should note that the model's performance may vary based on the complexity and context of the input text.
+        ## Authors:
+        The project, **Feriji dataset and Feriji-fr-to-dje**, was curated by **Elysabhete Ibrahim Amadou** and **Mamadou K. KEITA**, with the aim to enhance linguistic studies and translation capabilities between French and Zarma.
+        ## Citations
+        If you use this dataset or model in your research, please cite it as follows:
+        @dataset{Feriji,
+          author       = {Habibatou Abdoulaye Alfari, Elysabhete Ibrahim Amadou and Mamadou K. KEITA},
+          title        = {Feriji, a French-Zarma Parallel Corpus},
+          year         = 2023,
+          publisher    = {GitHub},
+          journal      = {GitHub repository},
+          howpublished = {\url{https://github.com/27-GROUP/Feriji}}
+        }
+    """
     with gr.Row():
+        gr.Markdown(markdown)
         with gr.Column():
             input_text = gr.components.Textbox(lines=7, label="Input Text", value="")
             return_seqs = gr.Slider(label="Number of return sequences", value=1, minimum=1, maximum=12, step=1)
             outputs = gr.Textbox(lines=7, label="Output Text")
+            translate_btn = gr.Button("Traduis!")
+            translate_btn.click(translate, inputs=[input_text, return_seqs], outputs=outputs)
 app.launch(share=True)