Spaces:

pdltiet
/

PDL_translate

Sleeping

App Files Community

vteam27 committed on Feb 1, 2024

Commit

79868fd

1 Parent(s): ef6d6f0

Added upload button

Browse files

Files changed (2) hide show

app.py +9 -7
lang_list.py +1 -93

app.py CHANGED Viewed

@@ -16,7 +16,9 @@ processor = AutoProcessor.from_pretrained("facebook/hf-seamless-m4t-medium")
 # print(translated_text_from_text)
-def run_t2tt(input_text: str, source_language: str, target_language: str) -> str:
     source_language_code = LANGUAGE_NAME_TO_CODE[source_language]
     target_language_code = LANGUAGE_NAME_TO_CODE[target_language]
     text_inputs = processor(text = input_text, src_lang=source_language_code , return_tensors="pt")
@@ -25,17 +27,17 @@ def run_t2tt(input_text: str, source_language: str, target_language: str) -> str
     return str(output)
 with gr.Blocks() as demo_t2tt:
     with gr.Row():
         with gr.Column():
             with gr.Group():
                 input_text = gr.Textbox(label="Input text")
                 with gr.Row():
                     source_language = gr.Dropdown(
                         label="Source language",
                         choices=TEXT_SOURCE_LANGUAGE_NAMES,
-                        value="English",
                     )
                     target_language = gr.Dropdown(
                         label="Target language",
@@ -49,7 +51,7 @@ with gr.Blocks() as demo_t2tt:
     gr.Examples(
         examples=[
             [
-                "The sinister destruction of the holy Akal Takht and the ruthless massacre of thousands of innocent pilgrims had unmasked the deep-seated hatred and animosity that the Indian Government had been nurturing against Sikhs ever since inde- pendence",
                 "English",
                 "Punjabi",
             ],
@@ -69,17 +71,17 @@ with gr.Blocks() as demo_t2tt:
                 "English",
             ],
         ],
-        inputs=[input_text, source_language, target_language],
         outputs=output_text,
         fn=run_t2tt,
-        cache_examples=True,
         api_name=False,
     )
     gr.on(
         triggers=[input_text.submit, btn.click],
         fn=run_t2tt,
-        inputs=[input_text, source_language, target_language],
         outputs=output_text,
         api_name="t2tt",
     )

 # print(translated_text_from_text)
+def run_t2tt(file_uploader , input_text: str, source_language: str, target_language: str) -> str:
+    if file_uploader is not None:
+        input_text = file_uploader.read().decode("utf-8")
     source_language_code = LANGUAGE_NAME_TO_CODE[source_language]
     target_language_code = LANGUAGE_NAME_TO_CODE[target_language]
     text_inputs = processor(text = input_text, src_lang=source_language_code , return_tensors="pt")
     return str(output)
 with gr.Blocks() as demo_t2tt:
     with gr.Row():
         with gr.Column():
             with gr.Group():
+                file_uploader = gr.File(label="Upload a text file (Optional)", type="txt")
                 input_text = gr.Textbox(label="Input text")
                 with gr.Row():
                     source_language = gr.Dropdown(
                         label="Source language",
                         choices=TEXT_SOURCE_LANGUAGE_NAMES,
+                        value="Punjabi",
                     )
                     target_language = gr.Dropdown(
                         label="Target language",
     gr.Examples(
         examples=[
             [
+                "The sinister destruction of the holy Akal Takht and the ruthless massacre of thousands of innocent pilgrims had unmasked the deep-seated hatred and animosity that the Indian Government had been nurturing against Sikhs ever since independence",
                 "English",
                 "Punjabi",
             ],
                 "English",
             ],
         ],
+        inputs=[file_uploader ,input_text, source_language, target_language],
         outputs=output_text,
         fn=run_t2tt,
+        cache_examples=False,
         api_name=False,
     )
     gr.on(
         triggers=[input_text.submit, btn.click],
         fn=run_t2tt,
+        inputs=[file_uploader, input_text, source_language, target_language],
         outputs=output_text,
         api_name="t2tt",
     )

lang_list.py CHANGED Viewed

@@ -108,101 +108,9 @@ LANGUAGE_NAME_TO_CODE = {v: k for k, v in language_code_to_name.items()}
 # Source langs: S2ST / S2TT / ASR don't need source lang
 # T2TT / T2ST use this
 text_source_language_codes = [
-    "afr",
-    "amh",
-    "arb",
-    "ary",
-    "arz",
-    "asm",
-    "azj",
-    "bel",
-    "ben",
-    "bos",
-    "bul",
-    "cat",
-    "ceb",
-    "ces",
-    "ckb",
-    "cmn",
-    "cym",
-    "dan",
-    "deu",
-    "ell",
-    "eng",
-    "est",
-    "eus",
-    "fin",
-    "fra",
-    "gaz",
-    "gle",
-    "glg",
-    "guj",
-    "heb",
     "hin",
-    "hrv",
-    "hun",
-    "hye",
-    "ibo",
-    "ind",
-    "isl",
-    "ita",
-    "jav",
-    "jpn",
-    "kan",
-    "kat",
-    "kaz",
-    "khk",
-    "khm",
-    "kir",
-    "kor",
-    "lao",
-    "lit",
-    "lug",
-    "luo",
-    "lvs",
-    "mai",
-    "mal",
-    "mar",
-    "mkd",
-    "mlt",
-    "mni",
-    "mya",
-    "nld",
-    "nno",
-    "nob",
-    "npi",
-    "nya",
-    "ory",
     "pan",
-    "pbt",
-    "pes",
-    "pol",
-    "por",
-    "ron",
-    "rus",
-    "slk",
-    "slv",
-    "sna",
-    "snd",
-    "som",
-    "spa",
-    "srp",
-    "swe",
-    "swh",
-    "tam",
-    "tel",
-    "tgk",
-    "tgl",
-    "tha",
-    "tur",
-    "ukr",
-    "urd",
-    "uzn",
-    "vie",
-    "yor",
-    "yue",
-    "zsm",
-    "zul",
 ]
 TEXT_SOURCE_LANGUAGE_NAMES = sorted([language_code_to_name[code] for code in text_source_language_codes])

 # Source langs: S2ST / S2TT / ASR don't need source lang
 # T2TT / T2ST use this
 text_source_language_codes = [
     "hin",
     "pan",
+    "eng",
 ]
 TEXT_SOURCE_LANGUAGE_NAMES = sorted([language_code_to_name[code] for code in text_source_language_codes])