Files
d365scm/translate_all.py
2026-03-21 09:12:47 +08:00

117 lines
3.5 KiB
Python

#!/usr/bin/env python3
"""
自动翻译所有题目
"""
import json
import os
import time
import urllib.request
import ssl
API_KEY = "sk-74905419d30541d18991396892bb27b0"
API_URL = "https://dashscope.aliyuncs.com/api/v1/services/aigc/text-generation/generation"
def translate_text(text):
"""
使用阿里百炼API翻译文本
"""
if not text or not text.strip():
return text
prompt = f"""请将以下英文翻译成中文,保持专业术语的准确性,直接输出翻译结果,不要添加任何解释:
英文原文:
{text}
中文翻译:"""
try:
headers = {
'Content-Type': 'application/json',
'Authorization': f'Bearer {API_KEY}'
}
data = {
"model": "qwen-turbo",
"input": {
"messages": [
{
"role": "user",
"content": prompt
}
]
},
"parameters": {
"temperature": 0.1,
"max_tokens": 2000
}
}
req = urllib.request.Request(
API_URL,
data=json.dumps(data).encode('utf-8'),
headers=headers,
method='POST'
)
ssl_context = ssl.create_default_context()
with urllib.request.urlopen(req, context=ssl_context, timeout=60) as response:
result = json.loads(response.read().decode('utf-8'))
if result and 'output' in result and 'text' in result['output']:
translated = result['output']['text'].strip()
if translated.startswith('中文翻译:'):
translated = translated[6:].strip()
return translated
else:
print(f"API响应格式错误: {result}")
return text
except Exception as e:
print(f"翻译错误: {e}")
return text
def translate_all_questions(input_file, output_file):
"""
翻译所有题目
"""
if os.path.exists(output_file):
with open(output_file, 'r', encoding='utf-8') as f:
questions = json.load(f)
else:
with open(input_file, 'r', encoding='utf-8') as f:
questions = json.load(f)
total = len(questions)
for i, q in enumerate(questions):
print(f"翻译 Topic {q['topic']} - Question {q['question_num']} ({i+1}/{total})")
need_save = False
if 'stem_cn' not in q or not q['stem_cn'] or q['stem_cn'] == '待翻译...':
print(f" 翻译题干...")
q['stem_cn'] = translate_text(q['stem'])
need_save = True
time.sleep(0.3)
for opt in q['options']:
if 'text_cn' not in opt or not opt['text_cn'] or opt['text_cn'] == '待翻译...':
print(f" 翻译选项 {opt['label']}...")
opt['text_cn'] = translate_text(opt['text'])
need_save = True
time.sleep(0.2)
if need_save:
with open(output_file, 'w', encoding='utf-8') as f:
json.dump(questions, f, ensure_ascii=False, indent=2)
print(f"\n所有 {total} 道题目翻译完成!")
if __name__ == '__main__':
input_file = '/Users/duguoyou/D365/exam_data/questions.json'
output_file = '/Users/duguoyou/D365/exam_data/questions_translated.json'
translate_all_questions(input_file, output_file)