Spaces:

mintlee
/

MT_deploy

Running

App Files Community

mintlee committed on Jun 7

Commit

dee7654

1 Parent(s): 1b6f99d

add fix translate word

Browse files

Files changed (2) hide show

word/__pycache__/word_helper.cpython-310.pyc +0 -0
word/word_helper.py +9 -53

word/__pycache__/word_helper.cpython-310.pyc CHANGED Viewed

Binary files a/word/__pycache__/word_helper.cpython-310.pyc and b/word/__pycache__/word_helper.cpython-310.pyc differ

word/word_helper.py CHANGED Viewed

@@ -26,65 +26,21 @@ def batch_translate(texts, source_lang = 'English', target_lang="Vietnamese"):
     if not texts:
         return texts  # Skip if empty
-    system_prompt = """
-    Translate the contents of a JSON file from the specified source language to the specified target language while preserving the structure, spaces, and context of the original text.
-        Instructions:
-        1. You will be given three inputs: source language, target language, and a JSON file.
-        2. The JSON file contains a Python dictionary where each key is an integer, and each value is a string.
-        3. Ensure one-to-one correspondence—each input item must correspond to exactly one output item with the same number of items.
-        4. The names of people, places, and organizations should be preserved in the translation.
-        5. Preserve spaces before or after strings. Do not remove, merge, split, or omit any strings.
-        6. Translate paragraphs and ensure the translation makes sense when text is put together.
-        7. Translate split words so that the word is not split in the translation.
-        8. Return a JSON object that is a Python dictionary containing as many items as the original JSON file, with keys and order preserved.
-        9. The output must be a syntactically correct Python dictionary.
-        Additional Examples:
-        **Input 1**:
-        - Source language: English
-        - Target language: Vietnamese
-        - JSON file:
-        ```json
-        {"0": "My name is ", "1": "Huy", "2": ".", "3": " Today is ", "4": "a ", "5": "good day", "6": ".", "7": ""}
-        ```
-        **Output 1**:
-        ```json
-        {"0": "Tên tôi là ", "1": "Huy", "2": ".", "3": " Hôm nay là ", "4": "một ", "5": "ngày đẹp", "6": ".", "7": ""}
-        ```
-        **Input 2**:
-        - Source language: English
-        - Target language: Spanish
-        - JSON file:
-        ```json
-        {"0": "The sky is ", "1": "blue", "2": ".", "3": " Water is ", "4": "essential", "5": " for ", "6": "life", "7": "."}
-        ```
-        **Output 2**:
-        ```json
-        {"0": "El cielo es ", "1": "azul", "2": ".", "3": " El agua es ", "4": "esencial", "5": " para ", "6": "la vida", "7": "."}
-        ```
-        **Input 3**:
-        - Source language: English
-        - Target language: French
-        - JSON file:
-        ```json
-        {"0": "The quick brown ", "1": "fox ", "2": "jumps ", "3": "over ", "4": "the ", "5": "lazy ", "6": "dog", "7": "."}
-        ```
-        **Output 3**:
-        ```json
-        {"0": "Le renard brun ", "1": "rapide ", "2": "saute ", "3": "par-dessus ", "4": "le ", "5": "chien ", "6": "paresseux", "7": "."}
-        ```
-        Perform the translation and return the result as specified above. Do not include any additional text other than the translated JSON object.
     """
     json_data = json.dumps({i: t for i, t in enumerate(texts)})
     user_prompt = f"Source language: {source_lang}. Target language: {target_lang}. JSON file: {json_data}"
     model = genai.GenerativeModel('gemini-2.0-flash')
     response = model.generate_content(contents = system_prompt.strip() + "\n" + user_prompt.strip(), generation_config={
-            'temperature': 1,  # Adjust temperature for desired creativity
             'top_p': 1,
             'top_k': 1,})
     # response_dict = ast.literal_eval(response.text.strip().strip("json```").strip("```").strip().strip("\""))

     if not texts:
         return texts  # Skip if empty
+    system_prompt = f"""Translate the string values within the following JSON object .
+        Follow these instructions carefully:
+        1.  Analyze the entire JSON object to understand the context.
+        2.  Translate *only* the string values.
+        3.  Keep the original keys *exactly* as they are.
+        4.  Do *not* translate non-string values (like hex color codes, numbers, or potentially proper nouns like 'CALISTOGA', 'DM SANS', 'Pexels', 'Pixabay' unless they have a common translation). Use your best judgment for proper nouns.
+        5.  Preserve the original JSON structure perfectly.
+        6.  Your output *must* be only the translated JSON object, without any introductory text, explanations, or markdown formatting like ```json ... ```.
     """
     json_data = json.dumps({i: t for i, t in enumerate(texts)})
     user_prompt = f"Source language: {source_lang}. Target language: {target_lang}. JSON file: {json_data}"
     model = genai.GenerativeModel('gemini-2.0-flash')
     response = model.generate_content(contents = system_prompt.strip() + "\n" + user_prompt.strip(), generation_config={
+            'temperature': 0.3,  # Adjust temperature for desired creativity
             'top_p': 1,
             'top_k': 1,})
     # response_dict = ast.literal_eval(response.text.strip().strip("json```").strip("```").strip().strip("\""))