diff --git a/docutranslate/app.py b/docutranslate/app.py index ead3427..6e591f7 100644 --- a/docutranslate/app.py +++ b/docutranslate/app.py @@ -113,6 +113,7 @@ def _create_default_task_state() -> Dict[str, Any]: "original_filename": None, "temp_dir": None, # 用于存储临时文件的目录 "downloadable_files": {}, # 存储可下载文件的路径和名称 + "attachment_files": {}, # 存储附件文件的路径和标识符 } @@ -202,9 +203,10 @@ DocuTranslate 后端服务 API,提供文档翻译、状态查询、结果下 2. **`GET /service/status/{{task_id}}`**: 使用获取到的 `task_id` 轮询此端点,获取任务的实时状态。 3. **`GET /service/logs/{{task_id}}`**: (可选) 获取实时的翻译日志。 4. **`GET /service/download/{{task_id}}/{{file_type}}`**: 任务完成后 (当 `download_ready` 为 `true` 时),通过此端点下载结果文件。 -5. **`GET /service/content/{{task_id}}/{{file_type}}`**: 任务完成后(当 `download_ready` 为 `true` 时),以JSON格式获取文件内容。 -6. **`POST /service/cancel/{{task_id}}`**: (可选) 取消一个正在进行的任务。 -7. **`POST /service/release/{{task_id}}`**: (可选) 当任务不再需要时,释放其在服务器上占用的所有资源,包括临时文件。 +5. **`GET /service/attachment/{{task_id}}/{{identifier}}`**: (可选) 如果任务生成了附件(如术语表),通过此端点下载。 +6. **`GET /service/content/{{task_id}}/{{file_type}}`**: 任务完成后(当 `download_ready` 为 `true` 时),以JSON格式获取文件内容。 +7. **`POST /service/cancel/{{task_id}}`**: (可选) 取消一个正在进行的任务。 +8. **`POST /service/release/{{task_id}}`**: (可选) 当任务不再需要时,释放其在服务器上占用的所有资源,包括临时文件。 **版本**: {__version__} """, @@ -795,6 +797,23 @@ async def _perform_translation( except Exception as export_error: task_logger.error(f"生成 {file_type} 文件时出错: {export_error}", exc_info=True) + # 处理附件文件 + attachment_files = {} + attachment_object = workflow.get_attachment() + if attachment_object and attachment_object.attachment_dict: + task_logger.info(f"发现 {len(attachment_object.attachment_dict)} 个附件,正在处理...") + for identifier, doc in attachment_object.attachment_dict.items(): + try: + # 'doc' is a Document object + attachment_filename = f"{doc.stem or identifier}.{doc.suffix}" + attachment_path = os.path.join(temp_dir, attachment_filename) + with open(attachment_path, "wb") as f: + f.write(doc.content) + attachment_files[identifier] = {"path": attachment_path, "filename": attachment_filename} + task_logger.info(f"成功生成附件 '{identifier}' 文件: {attachment_filename}") + except Exception as attachment_error: + task_logger.error(f"生成附件 '{identifier}' 文件时出错: {attachment_error}", exc_info=True) + # 5. 任务成功,更新最终状态 end_time = time.time() duration = end_time - task_state["task_start_time"] @@ -804,6 +823,7 @@ async def _perform_translation( "error_flag": False, "task_end_time": end_time, "downloadable_files": downloadable_files, + "attachment_files": attachment_files, }) task_logger.info(f"翻译成功完成,用时 {duration:.2f} 秒。") @@ -867,7 +887,7 @@ async def _start_translation_task( "original_filename_stem": Path(original_filename).stem, "original_filename": original_filename, "task_start_time": time.time(), "task_end_time": 0, "current_task_ref": None, - "temp_dir": None, "downloadable_files": {}, + "temp_dir": None, "downloadable_files": {}, "attachment_files": {}, }) log_history = tasks_log_histories[task_id] @@ -1014,7 +1034,7 @@ async def service_release_task(task_id: str): @service_router.get( "/status/{task_id}", summary="获取任务状态", - description="根据任务ID获取任务的当前状态。当 `download_ready` 为 `true` 时,`downloads` 对象中会包含可用的下载链接。", + description="根据任务ID获取任务的当前状态。当 `download_ready` 为 `true` 时,`downloads` 和 `attachment` 对象中会包含可用的下载链接。", responses={ 200: { "description": "成功获取任务状态。", @@ -1028,7 +1048,7 @@ async def service_release_task(task_id: str): "status_message": "正在处理 'annual_report.pdf'...", "error_flag": False, "download_ready": False, "original_filename_stem": "annual_report", "original_filename": "annual_report.pdf", "task_start_time": 1678889400.0, - "task_end_time": 0, "downloads": {} + "task_end_time": 0, "downloads": {}, "attachment": {} } }, "completed_markdown": { @@ -1043,6 +1063,26 @@ async def service_release_task(task_id: str): "html": "/service/download/b2865b93/html", "markdown": "/service/download/b2865b93/markdown", "markdown_zip": "/service/download/b2865b93/markdown_zip" + }, + "attachment": {} + } + }, + "completed_with_attachment": { + "summary": "已完成 (带附件)", + "value": { + "task_id": "g1h2i3j4", "is_processing": False, + "status_message": "翻译成功!用时 125.00 秒。", + "error_flag": False, "download_ready": True, + "original_filename_stem": "complex_document", + "original_filename": "complex_document.docx", + "task_start_time": 1678891000.0, + "task_end_time": 1678891125.0, + "downloads": { + "docx": "/service/download/g1h2i3j4/docx", + "html": "/service/download/g1h2i3j4/html" + }, + "attachment": { + "glossary": "/service/attachment/g1h2i3j4/glossary" } } }, @@ -1062,7 +1102,8 @@ async def service_release_task(task_id: str): "xlsx": "/service/download/d7e8f9a0/xlsx", "csv": "/service/download/d7e8f9a0/csv", "html": "/service/download/d7e8f9a0/html" - } + }, + "attachment": {} } }, "completed_docx": { @@ -1076,7 +1117,8 @@ async def service_release_task(task_id: str): "downloads": { "docx": "/service/download/f8a9c1b2/docx", "html": "/service/download/f8a9c1b2/html" - } + }, + "attachment": {} } }, "completed_epub": { @@ -1090,7 +1132,8 @@ async def service_release_task(task_id: str): "downloads": { "epub": "/service/download/e9b8d7c6/epub", "html": "/service/download/e9b8d7c6/html" - } + }, + "attachment": {} } }, # --- HTML STATUS EXAMPLE START --- @@ -1104,7 +1147,8 @@ async def service_release_task(task_id: str): "task_end_time": 1678890115.78, "downloads": { "html": "/service/download/a1b2c3d4/html" - } + }, + "attachment": {} } }, # --- HTML STATUS EXAMPLE END --- @@ -1115,7 +1159,7 @@ async def service_release_task(task_id: str): "status_message": "翻译过程中发生错误: LLM API key is invalid", "error_flag": True, "download_ready": False, "original_filename_stem": "bad_config", "original_filename": "bad_config.json", "task_start_time": 1678889600.0, - "task_end_time": 1678889610.0, "downloads": {} + "task_end_time": 1678889610.0, "downloads": {}, "attachment": {} } } } @@ -1136,6 +1180,11 @@ async def service_get_status( for file_type in task_state["downloadable_files"].keys(): downloads[file_type] = f"/service/download/{task_id}/{file_type}" + attachments = {} + if task_state.get("download_ready") and task_state.get("attachment_files"): + for identifier in task_state["attachment_files"].keys(): + attachments[identifier] = f"/service/attachment/{task_id}/{identifier}" + return JSONResponse(content={ "task_id": task_id, "is_processing": task_state["is_processing"], @@ -1146,7 +1195,8 @@ async def service_get_status( "original_filename": task_state.get("original_filename"), "task_start_time": task_state["task_start_time"], "task_end_time": task_state["task_end_time"], - "downloads": downloads + "downloads": downloads, + "attachment": attachments }) @@ -1218,6 +1268,42 @@ async def service_download_file( return FileResponse(path=file_path, media_type=media_type, filename=filename) +@service_router.get( + "/attachment/{task_id}/{identifier}", + summary="下载附件文件", + description="根据任务ID和附件标识符下载在翻译过程中生成的附加文件,例如自动生成的术语表。", + responses={ + 200: { + "description": "成功返回文件流。文件名通过 Content-Disposition 头指定。", + "content": { + "application/octet-stream": {"schema": {"type": "string", "format": "binary"}}, + } + }, + 404: {"description": "任务ID不存在,或该任务没有指定的附件,或临时文件已丢失。"}, + } +) +async def service_download_attachment( + task_id: str = FastApiPath(..., description="已完成任务的ID", examples=["g1h2i3j4"]), + identifier: str = FastApiPath(..., description="要下载的附件的标识符。", examples=["glossary"]) +): + task_state = tasks_state.get(task_id) + if not task_state: + raise HTTPException(status_code=404, detail=f"找不到任务ID '{task_id}'。") + + attachment_info = task_state.get("attachment_files", {}).get(identifier) + if not attachment_info or not os.path.exists(attachment_info.get("path")): + raise HTTPException(status_code=404, + detail=f"任务 '{task_id}' 不存在标识符为 '{identifier}' 的附件,或文件已丢失。") + + file_path = attachment_info["path"] + filename = attachment_info["filename"] + + # Use a generic media type as attachments can be of various formats + media_type = "application/octet-stream" + + return FileResponse(path=file_path, media_type=media_type, filename=filename) + + @service_router.get( "/content/{task_id}/{file_type}", summary="下载翻译结果内容 (JSON)", diff --git a/docutranslate/static/i18nData.json b/docutranslate/static/i18nData.json index 3f361c3..e81ebf2 100644 --- a/docutranslate/static/i18nData.json +++ b/docutranslate/static/i18nData.json @@ -18,23 +18,18 @@ "insertModeAppend": "附加到原文后 (Append)", "insertModePrepend": "附加到原文前 (Prepend)", "insertModeHelpDocx": "选择如何将翻译后的文本插入。", + "separatorLabel": "分隔符", + "separatorHelp": "当插入模式为附加或前置时,用于分隔原文和译文的字符。\\n 代表换行。", "insertModeHelpXlsx": "选择如何将翻译后的文本插入到单元格中。", + "xlsxTranslateRegionsLabel": "翻译区域 (可选)", "insertModeHelpSrt": "选择如何将翻译后的文本插入。", "insertModeHelpEpub": "选择如何将翻译后的文本插入。", "insertModeHelpHtml": "选择如何将翻译后的文本插入。", - "separatorLabel": "分隔符", - "separatorPlaceholder": "例如: \\n---翻译---\\n", - "separatorPlaceholderSimple": "例如: \\n---\\n", - "separatorHelp": "当插入模式为附加或前置时,用于分隔原文和译文的字符。\\n 代表换行。", - "xlsxTranslateRegionsLabel": "翻译区域 (可选)", - "xlsxTranslateRegionsPlaceholder": "每行一个区域, 例如:Sheet1!A1:B10(不指定表名则对所有表生效)", "jsonPathLabel": "需要翻译的JSON路径", - "jsonPathPlaceholder": "每行一个路径, 例如:\n$.name\n$.*", "jsonPathHelp": "采用jsonpath-ng的路径选择语法,每一行表示一个json路径", "parsingEngineLabel": "解析引擎", "parsingEngineHelp": "如果上传的文件本身是.md格式,此项可不选。", "getMineruTokenTitle": "获取Mineru Token", - "mineruTokenPlaceholder": "使用Mineru引擎时需要", "modelVersionLabel": "Mineru 模型版本", "modelVersionVlm": "VLM", "modelVersionPipline": "Pipeline", @@ -44,33 +39,28 @@ "platformLabel": "选择平台", "platformCustom": "自定义接口", "baseUrlLabel": "API 地址 (Base URL)", - "baseUrlPlaceholder": "OpenAi兼容地址", "getApiKeyTitle": "获取API Key", - "apiKeyPlaceholder": "请输入您的API Key", "modelIdLabel": "模型 ID", - "modelIdPlaceholder": "例如: gpt-4o, glm-4", "targetLanguageLabel": "目标语言", "targetLanguageCustom": "其它 (自定义)", - "customLangPlaceholder": "请输入目标语言, 例如: Italian", "thinkingModeLabel": "思考模式", "thinkingModeTooltip": "设置混合推理模型的思考模式,目前支持智谱平台的glm-4.5系列、阿里云的qwen3系列、火山引擎的Doubao-Seed-1.6系列等", "thinkingModeEnable": "启用", "thinkingModeDisable": "禁用", "thinkingModeDefault": "默认", "customPromptLabel": "自定义Prompt", - "customPromptPlaceholder": "可选,如“人名保持原文不翻译”", + "chunkSizeLabel": "分块大小", + "resetBtn": "重置", + "concurrentLabel": "并发数", + "glossaryGenTitle": "5. 术语表", "glossaryLabel": "术语表 (可选)", "glossaryHelp": "选择一个或多个CSV文件。文件需包含'src'和'dst'两列标题,分别代表原文和译文。", "viewGlossaryBtn": "查看术语表", "clearGlossaryBtn": "清空", - "glossaryGenTitle": "术语表", "glossaryGenEnableLabel": "自动生成术语表", "glossaryGenConfigLabel": "生成术语表配置", "glossaryGenConfigSame": "与翻译配置相同", "glossaryGenConfigCustom": "自定义", - "resetBtn": "重置", - "chunkSizeLabel": "分块大小", - "concurrentLabel": "并发数", "githubInfo": "GitHub主页(欢迎star❤):
https://github.com/xunbu/docutranslate", "qqGroupInfo": "交流QQ群: 1047781902", "taskListTitle": "任务列表", @@ -80,11 +70,12 @@ "taskCardIdPlaceholder": "等待提交...", "taskCardFileDrop": "点击或拖拽文件到此处", "taskCardFileSelected": "文件已选择", - "taskCardFilenameLabel": "文件名:", + "taskCardFilenameLabel": "文件名: ", "taskCardLogLabel": "日志", "taskCardStatusWaiting": "等待上传文件...", "taskCardPreviewBtn": "预览", "taskCardDownloadBtn": "下载", + "taskCardAttachmentBtn": "附件", "taskCardStartBtn": "开始翻译", "downloadMdEmbedded": "Markdown(嵌图)", "downloadMdZip": "Markdown压缩包", @@ -96,7 +87,7 @@ "closeBtn": "关闭", "downloadBtn": "下载", "tutorialModalTitle": "使用教程", - "tutorialModalBody": "

视频教程可以在B站搜索 docutranslate 获取。

欢迎使用 DocuTranslate!请按照以下步骤完成文档翻译:

  1. 选择工作流

    首先,在配置面板顶部选择您需要的翻译流程。不同的工作流适用于不同类型的文件:

    新增功能: \"自动选择工作流\"开关已默认开启。您只需上传文件,系统会自动为您匹配合适的工作流,简化操作。

  2. 配置参数

    根据您选择的工作流,完成相应的配置。所有配置项都会自动保存在您的浏览器中。

  3. 上传文件

    在右侧的任务列表中,点击或拖拽您的文档到文件上传区域。

  4. 开始翻译

    文件选择成功后,点击任务卡片右下角的 开始翻译 按钮。系统将开始处理任务,您可以在日志区域查看实时进度。

  5. 查看与下载

    翻译完成后,任务卡片下方会出现操作按钮:

提示: 所有配置都会自动保存在您的浏览器本地,方便下次使用。
", + "tutorialModalBody": "

视频教程可以在B站搜索 docutranslate 获取。

欢迎使用 DocuTranslate!请按照以下步骤完成文档翻译:

  1. 选择工作流

    首先,在配置面板顶部选择您需要的翻译流程。不同的工作流适用于不同类型的文件:

    新增功能: \"自动选择工作流\"开关已默认开启。您只需上传文件,系统会自动为您匹配合适的工作流,简化操作。
  2. 配置参数

    根据您选择的工作流,完成相应的配置。所有配置项都会自动保存在您的浏览器中。

  3. 上传文件

    在右侧的任务列表中,点击或拖拽您的文档到文件上传区域。

  4. 开始翻译

    文件选择成功后,点击任务卡片右下角的 开始翻译 按钮。系统将开始处理任务,您可以在日志区域查看实时进度。

  5. 查看与下载

    翻译完成后,任务卡片下方会出现操作按钮:

提示: 所有配置都会自动保存在您的浏览器本地,方便下次使用。
", "tutorialUnderstandBtn": "我明白了", "contributorsModalTitle": "感谢贡献", "contributorsPara1": "DocuTranslate是一个开源项目!大家的需求与使用是项目进步的动力。", @@ -109,6 +100,16 @@ "glossaryModalTitle": "当前术语表", "glossaryTableSource": "原文 (src)", "glossaryTableDestination": "译文 (dst)", + "separatorPlaceholder": "例如: \\n---翻译---\\n", + "separatorPlaceholderSimple": "例如: \\n---\\n", + "xlsxTranslateRegionsPlaceholder": "每行一个区域, 例如:Sheet1!A1:B10(不指定表名则对所有表生效)", + "jsonPathPlaceholder": "每行一个路径, 例如:\n$.name\n$.*", + "mineruTokenPlaceholder": "使用Mineru引擎时需要", + "baseUrlPlaceholder": "OpenAi兼容地址", + "apiKeyPlaceholder": "请输入您的API Key", + "modelIdPlaceholder": "例如: gpt-4o, glm-4", + "customLangPlaceholder": "请输入目标语言, 例如: Italian", + "customPromptPlaceholder": "可选,如“人名保持原文不翻译”", "init_i18n_failed_alert": "加载界面翻译资源失败,请检查网络连接或联系管理员。", "init_failed_alert": "初始化失败,无法连接到后端服务。请检查服务是否运行或刷新页面。", "glossaryEmpty": "术语表为空。", @@ -121,44 +122,43 @@ "htmlSettingsTitleText": "HTML翻译选项", "aiSettingsTitleText": "翻译模型", "translationSettingsTitleText": "翻译配置", - "advancedSettingsTitleText": "高级参数", - "engineOptionIdentity": "不转换(Identity)", + "engineOptionIdentity": "默认", "engineOptionMineru": "Mineru", "engineOptionDocling": "Docling", "status_selectFileFirst": "请先选择文件!", "status_fillRequired": "请填写所有必填项!", - "status_invalidWorkflow": "选择了无效的工作流。", + "status_invalidWorkflow": "选择了无效的工作流", "status_releasingOldTask": "正在释放旧任务资源...", - "btn_initializing": "初始化...", - "status_encodingAndSubmitting": "正在编码文件并提交任务...", + "btn_initializing": "初始化中...", + "status_encodingAndSubmitting": "文件编码并提交中...", "status_requestOk": "任务请求成功,等待处理...", "btn_cancelTranslation": "取消翻译", "status_requestFail": "请求失败", "status_initFail": "任务启动失败", "status_cancelling": "取消中...", - "status_cancelSent": "取消请求已发送。", + "status_cancelSent": "取消请求已发送", "status_cancelFail": "取消失败", - "status_gettingStatus": "正在获取状态...", + "admin_tasklist_failed": "管理员模式:加载任务列表失败。", + "status_gettingStatus": "获取状态中...", "btn_reTranslate": "重新翻译", - "status_updateError": "状态更新失败。", - "preview_loading": "正在加载预览...", + "status_updateError": "状态更新失败,请检查网络", + "preview_loading": "加载预览中...", "preview_cantReadOriginal": "无法读取原文内容。", "preview_cantPreviewType": "无法预览此文件类型", "preview_noOriginalCache": "无原文缓存,请重新上传文件以预览。", - "preview_loadFailed": "加载预览失败。", - "pdf_preparing": "正在准备PDF...", - "pdf_print_failed": "打印/另存为PDF失败。可能是浏览器限制或预览内容问题。", - "pdf_fetch_failed": "获取预览内容失败,无法生成PDF。", - "preview_bilingual": "双语预览", - "preview_translatedOnly": "仅译文预览", - "admin_tasklist_failed": "管理员模式:无法从服务器加载任务列表。" + "preview_loadFailed": "加载预览失败", + "pdf_preparing": "正在准备PDF,请稍候...", + "pdf_print_failed": "调用打印功能失败,请尝试手动保存为PDF。", + "pdf_fetch_failed": "获取HTML内容失败,无法生成PDF。", + "preview_bilingual": "双语对照预览", + "preview_translatedOnly": "仅译文预览" }, "en": { "pageTitle": "DocuTranslate - Interactive Document Translation", "tutorialBtn": "Tutorial", - "projectContributeBtn": "Contribute", + "projectContributeBtn": "Collaborate", "workflowTitle": "1. Select Workflow", - "workflowOptionMarkdown": "Translate via Markdown (.pdf/.md/.png, etc.)", + "workflowOptionMarkdown": "Markdown-based Translation (.pdf/.md/.png, etc.)", "workflowOptionTxt": "Plain Text Translation (.txt)", "workflowOptionJson": "JSON Translation (.json)", "workflowOptionDocx": "DOCX Translation (.docx)", @@ -171,101 +171,102 @@ "insertModeReplace": "Replace Original", "insertModeAppend": "Append to Original", "insertModePrepend": "Prepend to Original", - "insertModeHelpDocx": "Choose how the translated text is inserted.", - "insertModeHelpXlsx": "Choose how the translated text is inserted into cells.", - "insertModeHelpSrt": "Choose how the translated text is inserted.", - "insertModeHelpEpub": "Choose how the translated text is inserted.", - "insertModeHelpHtml": "Choose how the translated text is inserted.", + "insertModeHelpDocx": "Choose how to insert the translated text.", "separatorLabel": "Separator", - "separatorPlaceholder": "e.g., \\n---Translation---\\n", - "separatorPlaceholderSimple": "e.g., \\n---\\n", - "separatorHelp": "Characters used to separate original and translated text in 'Append' or 'Prepend' mode. \\n represents a newline.", - "xlsxTranslateRegionsLabel": "Translate Regions (Optional)", - "xlsxTranslateRegionsPlaceholder": "One region per line, e.g., Sheet1!A1:B10 (applies to all sheets if sheet name is omitted)", + "separatorHelp": "Separator character used between original and translated text when in Append or Prepend mode. \\n represents a newline.", + "insertModeHelpXlsx": "Choose how to insert translated text into cells.", + "xlsxTranslateRegionsLabel": "Translation Regions (Optional)", + "insertModeHelpSrt": "Choose how to insert the translated text.", + "insertModeHelpEpub": "Choose how to insert the translated text.", + "insertModeHelpHtml": "Choose how to insert the translated text.", "jsonPathLabel": "JSON Paths to Translate", - "jsonPathPlaceholder": "One path per line, e.g.:\n$.name\n$.*", - "jsonPathHelp": "Uses jsonpath-ng syntax. Each line represents a JSON path.", + "jsonPathHelp": "Uses jsonpath-ng syntax. Enter one JSON path per line.", "parsingEngineLabel": "Parsing Engine", - "parsingEngineHelp": "If the uploaded file is already in .md format, this can be left unselected.", + "parsingEngineHelp": "Not required if the uploaded file is already in .md format.", "getMineruTokenTitle": "Get Mineru Token", - "mineruTokenPlaceholder": "Required when using the Mineru engine", "modelVersionLabel": "Mineru Model Version", "modelVersionVlm": "VLM", "modelVersionPipline": "Pipeline", - "modelVersionHelp": "Mineru VLM is a newer, internal beta model.", + "modelVersionHelp": "Mineru VLM is a newer model in beta.", "formulaOcrLabel": "Formula Recognition", "codeOcrLabel": "Code Recognition", "platformLabel": "Select Platform", "platformCustom": "Custom Endpoint", - "baseUrlLabel": "API Base URL", - "baseUrlPlaceholder": "OpenAI-compatible URL", + "baseUrlLabel": "API Address (Base URL)", "getApiKeyTitle": "Get API Key", - "apiKeyPlaceholder": "Please enter your API Key", "modelIdLabel": "Model ID", - "modelIdPlaceholder": "e.g., gpt-4o, llama-3-70b", "targetLanguageLabel": "Target Language", "targetLanguageCustom": "Other (Custom)", - "customLangPlaceholder": "Enter target language, e.g., Italian", "thinkingModeLabel": "Thinking Mode", - "thinkingModeTooltip": "Sets the thinking mode for hybrid inference models, currently supporting Zhipu's glm-4.5 series, Alibaba Cloud's qwen3 series, Volcengine's Doubao-Seed-1.6 series, etc.", + "thinkingModeTooltip": "Set the thinking mode for mixed-inference models. Currently supports Zhipu's glm-4.5 series, Alibaba's qwen3 series, Volcengine's Doubao-Seed-1.6 series, etc.", "thinkingModeEnable": "Enable", "thinkingModeDisable": "Disable", "thinkingModeDefault": "Default", "customPromptLabel": "Custom Prompt", - "customPromptPlaceholder": "Optional, e.g., 'Do not translate proper names'", + "chunkSizeLabel": "Chunk Size", + "resetBtn": "Reset", + "concurrentLabel": "Concurrency", + "glossaryGenTitle": "5. Glossary", "glossaryLabel": "Glossary (Optional)", - "glossaryHelp": "Select one or more CSV files. Files must contain 'src' and 'dst' headers for source and destination terms.", + "glossaryHelp": "Select one or more CSV files. Files must have 'src' and 'dst' headers, representing source and destination text respectively.", "viewGlossaryBtn": "View Glossary", "clearGlossaryBtn": "Clear", - "glossaryGenTitle": "Glossary", "glossaryGenEnableLabel": "Auto-generate Glossary", "glossaryGenConfigLabel": "Glossary Generation Config", - "glossaryGenConfigSame": "Same as Translator", + "glossaryGenConfigSame": "Same as Translation Config", "glossaryGenConfigCustom": "Custom", - "resetBtn": "Reset", - "chunkSizeLabel": "Chunk Size", - "concurrentLabel": "Concurrency", - "githubInfo": "GitHub Repo (Star us! ❤):
https://github.com/xunbu/docutranslate", - "qqGroupInfo": "QQ Group for discussions: 1047781902", + "githubInfo": "GitHub (Star us! ❤):
https://github.com/xunbu/docutranslate", + "qqGroupInfo": "QQ Group: 1047781902", "taskListTitle": "Task List", "newTaskBtn": "New Task", - "noTaskPlaceholder": "No tasks yet. Click 'New Task' to get started!", + "noTaskPlaceholder": "No tasks yet. Click \"New Task\" to get started!", "taskCardIdLabel": "Task ID", "taskCardIdPlaceholder": "Awaiting submission...", "taskCardFileDrop": "Click or drag file here", "taskCardFileSelected": "File selected", - "taskCardFilenameLabel": "Filename:", + "taskCardFilenameLabel": "Filename: ", "taskCardLogLabel": "Log", "taskCardStatusWaiting": "Waiting for file upload...", "taskCardPreviewBtn": "Preview", "taskCardDownloadBtn": "Download", + "taskCardAttachmentBtn": "Attachments", "taskCardStartBtn": "Start Translation", - "downloadMdEmbedded": "Markdown (Embedded Imgs)", - "downloadMdZip": "Markdown (.zip)", + "downloadMdEmbedded": "Markdown (Embedded)", + "downloadMdZip": "Markdown (Zip)", "previewTitle": "Preview", "previewBilingualBtn": "Bilingual", "previewTranslatedOnlyBtn": "Translated Only", "previewOriginal": "Original", - "previewTranslated": "Translated", + "previewTranslated": "Translation", "closeBtn": "Close", "downloadBtn": "Download", - "tutorialModalTitle": "User Guide", - "tutorialModalBody": "

Video tutorials are available on Bilibili by searching for docutranslate.

Welcome to DocuTranslate! Follow these steps to translate your documents:

  1. Select Workflow

    First, choose your desired translation process from the top of the settings panel. Different workflows are suited for different file types:

    New Feature: The 'Auto-select workflow' switch is now on by default. Just upload your file, and the system will automatically match it to the appropriate workflow for you.

  2. Configure Parameters

    Configure the settings based on your chosen workflow. All settings are automatically saved in your browser.

  3. Upload File

    In the task list on the right, click or drag your document into the file upload area.

  4. Start Translation

    Once the file is selected, click the Start Translation button on the task card. The system will begin processing, and you can monitor real-time progress in the log area.

  5. View & Download

    After the translation is complete, action buttons will appear on the task card:

Tip: All your settings are automatically saved in your browser's local storage for your convenience.
", - "tutorialUnderstandBtn": "I understand", - "contributorsModalTitle": "Thanks for Contributing!", - "contributorsPara1": "DocuTranslate is an open-source project! The community's needs and usage are what drive the project forward.", - "contributorsPara2": "A heartfelt thank you to everyone who has funded the project, submitted code, provided valuable suggestions, and starred the repository!", - "contributorsWelcome": "You're welcome to contribute in the following ways:", - "contributorsGithub": "GitHub Repo", - "contributorsPR": "Submit a Pull Request", - "contributorsIssue": "Report an Issue", + "tutorialModalTitle": "Tutorial", + "tutorialModalBody": "

Video tutorials are available on YouTube by searching for docutranslate.

Welcome to DocuTranslate! Follow these steps to translate your documents:

  1. Select Workflow

    First, choose the appropriate translation process from the top of the settings panel. Different workflows are suited for different file types:

    New Feature: \"Auto-select workflow\" is now enabled by default. Simply upload your file, and the system will automatically match it with the correct workflow to simplify the process.
  2. Configure Parameters

    Configure the settings based on your chosen workflow. All settings are automatically saved in your browser.

  3. Upload File

    In the task list on the right, click or drag your document into the file upload area.

  4. Start Translation

    After selecting a file, click the Start Translation button on the task card. The system will begin processing, and you can monitor the progress in the log area.

  5. View & Download

    Once the translation is complete, new buttons will appear on the task card:

Tip: All your settings are automatically saved in your browser's local storage for future use.
", + "tutorialUnderstandBtn": "I Understand", + "contributorsModalTitle": "Thanks for Contributing", + "contributorsPara1": "DocuTranslate is an open-source project! The community's needs and usage are the driving force behind its progress.", + "contributorsPara2": "Thank you to everyone who has sponsored, contributed code, offered valuable suggestions, and starred the project!", + "contributorsWelcome": "We welcome contributions in the following ways:", + "contributorsGithub": "GitHub Page", + "contributorsPR": "Submit Pull Request", + "contributorsIssue": "Report Issue", "contributorsQQ": "Or contact the author via QQ Group: 1047781902", "glossaryModalTitle": "Current Glossary", "glossaryTableSource": "Source (src)", "glossaryTableDestination": "Destination (dst)", + "separatorPlaceholder": "e.g., \\n---Translation---\\n", + "separatorPlaceholderSimple": "e.g., \\n---\\n", + "xlsxTranslateRegionsPlaceholder": "One region per line, e.g., Sheet1!A1:B10 (applies to all sheets if sheet name is omitted)", + "jsonPathPlaceholder": "One path per line, e.g.,\n$.name\n$.*", + "mineruTokenPlaceholder": "Required when using Mineru engine", + "baseUrlPlaceholder": "OpenAI-compatible address", + "apiKeyPlaceholder": "Please enter your API Key", + "modelIdPlaceholder": "e.g., gpt-4o, glm-4", + "customLangPlaceholder": "Enter target language, e.g., Italian", + "customPromptPlaceholder": "Optional, e.g., \"Keep proper names in their original language\"", "init_i18n_failed_alert": "Failed to load interface translations. Please check your network connection or contact an administrator.", "init_failed_alert": "Initialization failed, could not connect to the backend service. Please ensure the service is running and refresh the page.", - "glossaryEmpty": "The glossary is empty.", + "glossaryEmpty": "Glossary is empty.", "parsingSettingsTitleText": "Parsing Config", "jsonSettingsTitleText": "JSON Path Config", "xlsxSettingsTitleText": "XLSX Translation Options", @@ -275,36 +276,35 @@ "htmlSettingsTitleText": "HTML Translation Options", "aiSettingsTitleText": "Translation Model", "translationSettingsTitleText": "Translation Config", - "advancedSettingsTitleText": "Advanced Parameters", - "engineOptionIdentity": "No Conversion (Identity)", + "engineOptionIdentity": "Default", "engineOptionMineru": "Mineru", "engineOptionDocling": "Docling", "status_selectFileFirst": "Please select a file first!", "status_fillRequired": "Please fill in all required fields!", - "status_invalidWorkflow": "Invalid workflow selected.", + "status_invalidWorkflow": "Invalid workflow selected", "status_releasingOldTask": "Releasing old task resources...", "btn_initializing": "Initializing...", - "status_encodingAndSubmitting": "Encoding file and submitting task...", + "status_encodingAndSubmitting": "Encoding and submitting file...", "status_requestOk": "Task submitted successfully, awaiting processing...", "btn_cancelTranslation": "Cancel Translation", - "status_requestFail": "Request failed", - "status_initFail": "Failed to start task", + "status_requestFail": "Request Failed", + "status_initFail": "Task initiation failed", "status_cancelling": "Cancelling...", - "status_cancelSent": "Cancellation request sent.", + "status_cancelSent": "Cancellation request sent", "status_cancelFail": "Cancellation failed", + "admin_tasklist_failed": "Admin Mode: Failed to load task list.", "status_gettingStatus": "Getting status...", - "btn_reTranslate": "Re-translate", - "status_updateError": "Failed to update status.", + "btn_reTranslate": "Translate Again", + "status_updateError": "Status update failed, please check network", "preview_loading": "Loading preview...", - "preview_cantReadOriginal": "Could not read original file content.", + "preview_cantReadOriginal": "Could not read original content.", "preview_cantPreviewType": "Cannot preview this file type", "preview_noOriginalCache": "No original file cached. Please re-upload to preview.", - "preview_loadFailed": "Failed to load preview.", - "pdf_preparing": "Preparing PDF...", - "pdf_print_failed": "Print/Save as PDF failed. This may be due to browser restrictions or preview content issues.", - "pdf_fetch_failed": "Failed to fetch preview content, cannot generate PDF.", + "preview_loadFailed": "Failed to load preview", + "pdf_preparing": "Preparing PDF, please wait...", + "pdf_print_failed": "Failed to invoke print function. Please try saving to PDF manually.", + "pdf_fetch_failed": "Failed to fetch HTML content, cannot generate PDF.", "preview_bilingual": "Bilingual Preview", - "preview_translatedOnly": "Translated Only Preview", - "admin_tasklist_failed": "Admin mode: Failed to load task list from server." + "preview_translatedOnly": "Translated-Only Preview" } } \ No newline at end of file diff --git a/docutranslate/static/index.html b/docutranslate/static/index.html index 4fb32e5..a9a6284 100644 --- a/docutranslate/static/index.html +++ b/docutranslate/static/index.html @@ -1 +1 @@ - DocuTranslate - 交互式文档翻译

DocuTranslate

如果上传的文件本身是.md格式,此项可不选。
mineru VLM是更新的内测模型。

选择一个或多个CSV文件。文件需包含'src'和'dst'两列标题,分别代表原文和译文。

GitHub主页(欢迎star❤):
https://github.com/xunbu/docutranslate

交流QQ群: 1047781902

任务列表

当前没有任务,点击“新建任务”开始吧!

预览
原文
译文
\ No newline at end of file + DocuTranslate - 交互式文档翻译

DocuTranslate

如果上传的文件本身是.md格式,此项可不选。
mineru VLM是更新的内测模型。

选择一个或多个CSV文件。文件需包含'src'和'dst'两列标题,分别代表原文和译文。

GitHub主页(欢迎star❤):
https://github.com/xunbu/docutranslate

交流QQ群: 1047781902

任务列表

当前没有任务,点击“新建任务”开始吧!

预览
原文
译文
\ No newline at end of file diff --git a/docutranslate/translator/ai_translator/base.py b/docutranslate/translator/ai_translator/base.py index 6050417..50dc464 100644 --- a/docutranslate/translator/ai_translator/base.py +++ b/docutranslate/translator/ai_translator/base.py @@ -53,8 +53,6 @@ class AiTranslator(Translator[T]): logger=self.logger, ) self.glossary_agent = GlossaryAgent(glossary_agent_config) - def get_glossary_dict(self): - return self.glossary_dict_gen @abstractmethod def translate(self, document: T) -> Document: ... diff --git a/docutranslate/translator/ai_translator/html_translator.py b/docutranslate/translator/ai_translator/html_translator.py index ecf0406..023d174 100644 --- a/docutranslate/translator/ai_translator/html_translator.py +++ b/docutranslate/translator/ai_translator/html_translator.py @@ -217,8 +217,8 @@ class HtmlTranslator(AiTranslator): return self if self.glossary_agent: - glossary_dict = await self.glossary_agent.send_segments_async(original_texts, self.chunk_size) - self.translate_agent.update_glossary_dict(glossary_dict) + self.glossary_dict_gen = await self.glossary_agent.send_segments_async(original_texts, self.chunk_size) + self.translate_agent.update_glossary_dict(self.glossary_dict_gen) translated_texts = await self.translate_agent.send_segments_async(original_texts, self.chunk_size) document.content = await asyncio.to_thread( diff --git a/docutranslate/translator/ai_translator/srt_translator.py b/docutranslate/translator/ai_translator/srt_translator.py index 7660b7e..46e7b8f 100644 --- a/docutranslate/translator/ai_translator/srt_translator.py +++ b/docutranslate/translator/ai_translator/srt_translator.py @@ -129,8 +129,8 @@ class SrtTranslator(AiTranslator): return self if self.glossary_agent: - glossary_dict = await self.glossary_agent.send_segments_async(original_texts, self.chunk_size) - self.translate_agent.update_glossary_dict(glossary_dict) + self.glossary_dict_gen = await self.glossary_agent.send_segments_async(original_texts, self.chunk_size) + self.translate_agent.update_glossary_dict(self.glossary_dict_gen) # --- 步骤 2: 调用翻译Agent (异步) --- translated_texts = await self.translate_agent.send_segments_async(original_texts, self.chunk_size) diff --git a/docutranslate/translator/ai_translator/txt_translator.py b/docutranslate/translator/ai_translator/txt_translator.py index 51da2e0..1364936 100644 --- a/docutranslate/translator/ai_translator/txt_translator.py +++ b/docutranslate/translator/ai_translator/txt_translator.py @@ -47,8 +47,8 @@ class TXTTranslator(AiTranslator): chunks: list[str] = split_markdown_text(document.content.decode(), max_block_size=self.chunk_size) if self.glossary_agent: - glossary_dict = await self.glossary_agent.send_segments_async(chunks, self.chunk_size) - self.translate_agent.update_glossary_dict(glossary_dict) + self.glossary_dict_gen = await self.glossary_agent.send_segments_async(chunks, self.chunk_size) + self.translate_agent.update_glossary_dict(self.glossary_dict_gen) self.logger.info(f"txt分为{len(chunks)}块") result: list[str] = await self.translate_agent.send_chunks_async(chunks) diff --git a/docutranslate/workflow/base.py b/docutranslate/workflow/base.py index 0f38bb2..39f703e 100644 --- a/docutranslate/workflow/base.py +++ b/docutranslate/workflow/base.py @@ -61,4 +61,5 @@ class Workflow(ABC, Generic[T_Config, T_original, T_Translated]): return self def get_attachment(self): + print(f"attachment:{self.attachment.attachment_dict}") return self.attachment