소스 검색

支持 gpt 批量修改翻译

gavin.chen 1 년 전
부모
커밋
32e36d8eed
4개의 변경된 파일129개의 추가작업 그리고 1개의 파일을 삭제
  1. 3 1
      .gitignore
  2. 38 0
      tools/JSON2MD.md
  3. 74 0
      tools/chat_gpt_process.md
  4. 14 0
      tools/prompt.md

+ 3 - 1
.gitignore

@@ -76,4 +76,6 @@ build/
 /pubspec.lock
 /py_generator/*
 
-*.xlsx
+*.xlsx
+gpt-outputs/*
+md-outputs/*

+ 38 - 0
tools/JSON2MD.md

@@ -0,0 +1,38 @@
+import json
+import os
+
+# 读取JSON数据
+with open("assets\zh_CN.json", "r", encoding="utf-8") as zh_file:
+    zh_data = json.load(zh_file)
+
+with open("assets\en_US.json", "r", encoding="utf-8") as en_file:
+    en_data = json.load(en_file)
+
+# 检查并创建md-outputs文件夹
+output_folder = "md-outputs"
+if not os.path.exists(output_folder):
+    os.makedirs(output_folder)
+    
+# 处理各个模块
+for module_name in zh_data.keys():
+    # 跳过locale字段
+    if module_name == "locale":
+        continue
+
+    # 提取翻译词条
+    translations = []
+    for key in zh_data[module_name].keys():
+        translations.append((key, zh_data[module_name][key], en_data[module_name][key]))
+
+    # 将翻译词条整理成Markdown格式
+    md_lines = ["| 词条 | 中文 | 英文 |", "| --- | --- | --- |"]
+
+    for translation in translations:
+        md_line = f"| {translation[0]} | {translation[1]} | {translation[2]} |"
+        md_lines.append(md_line)
+
+    md_content = "\n".join(md_lines)
+
+    # 输出结果到对应的Markdown文件
+    with open(os.path.join(output_folder, f"{module_name}-output.md"), "w", encoding="utf-8") as md_file:
+        md_file.write(md_content)

+ 74 - 0
tools/chat_gpt_process.md

@@ -0,0 +1,74 @@
+import os
+import openai
+import json
+import time
+
+def chat_gpt_runner(input_text):
+    try:
+        # 1. Read API key from environment variable
+        api_key = os.getenv("OPENAI_API_KEY")
+
+        # Print the first five lines of input_text
+        print("Input:\n" + "\n".join(input_text.splitlines()[:1]) + "...\n")
+
+        # 2. Set up OpenAI client
+        openai.api_key = api_key
+
+        response = openai.ChatCompletion.create(
+            model="gpt-3.5-turbo",
+            messages=[{"role": "user", "content": input_text}],
+            temperature=1.0,
+        )
+
+        output_text = response.choices[0].message.content
+
+        # Print the first three lines of output_text
+        print("Output:\n" + "\n".join(output_text.splitlines()[:3]) + "...\n")
+        
+        return output_text
+    except Exception as e:
+        print(f"Error: {e}")
+        return None
+
+def read_prompt(prompt_path):
+    with open(prompt_path, 'r', encoding="utf-8") as prompt_file:
+        return prompt_file.read()
+
+def read_write_md_files(input_path, output_path, prompt):
+    start_time = time.time()
+    for file in os.listdir(input_path):
+        if file.endswith(".md"):
+            with open(os.path.join(input_path, file), 'r', encoding="utf-8") as input_file:
+                lines = input_file.readlines()[2:]
+                output_filename = file.replace("-output", "-gpt-output")
+                output_filepath = os.path.join(output_path, output_filename)
+                
+                with open(output_filepath, 'w', encoding="utf-8") as output_file:
+                    for i in range(0, len(lines), 50):
+                        chunk = lines[i:i+50]
+                        single_start_time = time.time()
+                        result = chat_gpt_runner(prompt+"".join(chunk))
+                        output_file.write(result)
+                        output_file.write("\n\n")
+                        single_end_time = time.time()
+                        elapsed_single_time = single_end_time - single_start_time
+                        elapsed_total_time = single_end_time - start_time
+                        
+                        print(f"单次用时: {elapsed_single_time:.4f} 秒")
+                        print(f"当前总耗时: {elapsed_total_time:.4f} 秒")
+
+if __name__ == "__main__":
+    root_path = os.getcwd()
+    input_folder = "md-outputs"
+    output_folder = "gpt-outputs"
+    prompt_path = "tools\prompt.md"
+
+    input_path = os.path.join(root_path, input_folder)
+    output_path = os.path.join(root_path, output_folder)
+
+    if not os.path.exists(output_path):
+        os.makedirs(output_path)
+    
+    prompt_content = read_prompt(os.path.join(root_path, prompt_path))
+
+    read_write_md_files(input_path, output_path, prompt_content)

+ 14 - 0
tools/prompt.md

@@ -0,0 +1,14 @@
+假设你拥有gpt-4的能力,请你假设自己是一个地道的英语母语者,资深产品经理,资深翻译官,下面有一份医疗软件UI的i18n中英对照表格,帮我找出其中翻译不得当,不恰当,不合理的内容,给出不合理的理由,并给出合理的翻译,以md表格的形式回复我:
+回复格式:
+| 词条 | 中文 | 英文 | 优化后 |
+| --- | --- | --- | --- |
+...
+
+理由:  
+
+1. xxx  
+2. xxx  
+
+中英对照表格:
+| 词条 | 中文 | 英文 |
+| --- | --- | --- |