Spaces:

gauravchand11
/

Doc_Translation_Toolkit

Sleeping

App Files Community

gauravchand11 committed on Apr 24

Commit

ee20cf3

verified ·

1 Parent(s): 2e6a73b

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -30

app.py CHANGED Viewed

@@ -7,12 +7,6 @@ import re
 import torch
 from datetime import datetime
 import pytz
-from reportlab.pdfgen import canvas
-from reportlab.pdfbase import pdfmetrics
-from reportlab.pdfbase.ttfonts import TTFont
-from reportlab.lib.pagesizes import A4
-from reportlab.lib.units import inch
-from reportlab.pdfbase.cidfonts import UnicodeCIDFont
 from io import BytesIO
 from docx import Document
 import tempfile
@@ -303,7 +297,7 @@ def translate_text(text, src_lang, tgt_lang):
         return f"Error during translation: {str(e)}"
 # Document translation function
-def translate_document(file, source_lang, target_lang, output_format="txt"):
     try:
         if file is None:
             return "Please upload a file", None
@@ -318,30 +312,24 @@ def translate_document(file, source_lang, target_lang, output_format="txt"):
         # Translate
         translated_text = translate_text(input_text, source_lang, target_lang)
         # Create temporary file
         temp_dir = tempfile.gettempdir()
-        # Handle output format based on user selection and input type
         if input_ext == '.pdf':
-            # For PDF inputs, use the selected output format
-            if output_format == "docx":
-                output_filename = f"translated_{os.path.splitext(os.path.basename(file.name))[0]}.docx"
-                output_path = os.path.join(temp_dir, output_filename)
-                doc = Document()
-                for paragraph in translated_text.split('\n'):
-                    if paragraph.strip():
-                        doc.add_paragraph(paragraph)
-                doc.save(output_path)
-            else:  # default to txt
-                output_filename = f"translated_{os.path.splitext(os.path.basename(file.name))[0]}.txt"
-                output_path = os.path.join(temp_dir, output_filename)
-                with open(output_path, 'w', encoding='utf-8') as f:
-                    f.write(translated_text)
         elif input_ext == '.docx':
             # Create DOCX
-            output_filename = f"translated_{os.path.splitext(os.path.basename(file.name))[0]}.docx"
-            output_path = os.path.join(temp_dir, output_filename)
             doc = Document()
             for paragraph in translated_text.split('\n'):
                 if paragraph.strip():
@@ -349,9 +337,7 @@ def translate_document(file, source_lang, target_lang, output_format="txt"):
             doc.save(output_path)
         else:
-            # Default to txt for other formats
-            output_filename = f"translated_{os.path.splitext(os.path.basename(file.name))[0]}.txt"
-            output_path = os.path.join(temp_dir, output_filename)
             with open(output_path, 'w', encoding='utf-8') as f:
                 f.write(translated_text)
@@ -377,8 +363,8 @@ def create_interface():
     header = gr.Markdown(
         f"""
         # Document Translation Toolkit
-        **Current Date and Time (UTC):** {get_current_time()}
-        **Current User's Login:** gauravchand
         """
     )

 import torch
 from datetime import datetime
 import pytz
 from io import BytesIO
 from docx import Document
 import tempfile
         return f"Error during translation: {str(e)}"
 # Document translation function
+def translate_document(file, source_lang, target_lang):
     try:
         if file is None:
             return "Please upload a file", None
         # Translate
         translated_text = translate_text(input_text, source_lang, target_lang)
+        # Create output file with .txt extension for PDF inputs, otherwise same as input
+        if input_ext == '.pdf':
+            output_filename = f"translated_{os.path.splitext(os.path.basename(file.name))[0]}.txt"
+        else:
+            output_filename = f"translated_{os.path.splitext(os.path.basename(file.name))[0]}{input_ext}"
         # Create temporary file
         temp_dir = tempfile.gettempdir()
+        output_path = os.path.join(temp_dir, output_filename)
+        # Create appropriate file format
         if input_ext == '.pdf':
+            # Save as txt file
+            with open(output_path, 'w', encoding='utf-8') as f:
+                f.write(translated_text)
         elif input_ext == '.docx':
             # Create DOCX
             doc = Document()
             for paragraph in translated_text.split('\n'):
                 if paragraph.strip():
             doc.save(output_path)
         else:
+            # Default to txt
             with open(output_path, 'w', encoding='utf-8') as f:
                 f.write(translated_text)
     header = gr.Markdown(
         f"""
         # Document Translation Toolkit
+        *Current Date and Time (UTC):* {get_current_time()}
+        *Current User's Login:* gauravchand
         """
     )