Spaces:

LocaleNLP
/

english_darija

Sleeping

App Files Community

Mgolo committed on Aug 12

Commit

34f5d6a

verified ·

1 Parent(s): 83e8e50

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -9

app.py CHANGED Viewed

@@ -20,14 +20,14 @@ import chardet
 # Device setup
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
-# Load Wolof MarianMT model from HF hub (cached manually)
 translator = None
 whisper_model = None
-def load_wolof_model():
     global translator
     if translator is None:
-        model_name = "LocaleNLP/eng_wolof"
         model = AutoModelForSeq2SeqLM.from_pretrained(model_name).to(device)
         tokenizer = MarianTokenizer.from_pretrained(model_name)
         translator = pipeline("translation", model=model, tokenizer=tokenizer, device=0 if device.type == 'cuda' else -1)
@@ -91,8 +91,8 @@ def extract_text_from_file(uploaded_file):
             raise ValueError("Unsupported file type")
 def translate(text):
-    translator = load_wolof_model()
-    lang_tag = ">>wol<<"
     paragraphs = text.split("\n")
     translated_output = []
@@ -136,8 +136,8 @@ def translate_and_return(text):
 # Gradio UI components
 with gr.Blocks() as demo:
-    gr.Markdown("## LocaleNLP English-to-Wolof Translator")
-    gr.Markdown("Upload English text, audio, or document to translate to Wolof using a custom MarianMT model.")
     with gr.Row():
         input_mode = gr.Radio(choices=["Text", "Audio", "File"], label="Select input mode", value="Text")
@@ -147,8 +147,8 @@ with gr.Blocks() as demo:
     file_input = gr.File(file_types=['.pdf', '.docx', '.html', '.htm', '.md', '.srt', '.txt'], label="Upload document", visible=False)
     extracted_text = gr.Textbox(label="Extracted / Transcribed Text", lines=10, interactive=False)
-    translate_button = gr.Button("Translate to Wolof")
-    output_text = gr.Textbox(label="Translated Wolof Text", lines=10, interactive=False)
     def update_visibility(mode):
         return {

 # Device setup
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+# Load Darija MarianMT model from HF hub (cached manually)
 translator = None
 whisper_model = None
+def load_darija_model():
     global translator
     if translator is None:
+        model_name = "LocaleNLP/english_darija"
         model = AutoModelForSeq2SeqLM.from_pretrained(model_name).to(device)
         tokenizer = MarianTokenizer.from_pretrained(model_name)
         translator = pipeline("translation", model=model, tokenizer=tokenizer, device=0 if device.type == 'cuda' else -1)
             raise ValueError("Unsupported file type")
 def translate(text):
+    translator = load_darija_model()
+    lang_tag = ">>dar<<"
     paragraphs = text.split("\n")
     translated_output = []
 # Gradio UI components
 with gr.Blocks() as demo:
+    gr.Markdown("## LocaleNLP English-to-Darija Translator")
+    gr.Markdown("Upload English text, audio, or document to translate to Darija using Localenlp model.")
     with gr.Row():
         input_mode = gr.Radio(choices=["Text", "Audio", "File"], label="Select input mode", value="Text")
     file_input = gr.File(file_types=['.pdf', '.docx', '.html', '.htm', '.md', '.srt', '.txt'], label="Upload document", visible=False)
     extracted_text = gr.Textbox(label="Extracted / Transcribed Text", lines=10, interactive=False)
+    translate_button = gr.Button("Translate to Darija")
+    output_text = gr.Textbox(label="Translated Darija Text", lines=10, interactive=False)
     def update_visibility(mode):
         return {