diff --git a/docutranslate/app.py b/docutranslate/app.py
index 6326d98..adb2cf3 100644
--- a/docutranslate/app.py
+++ b/docutranslate/app.py
@@ -65,6 +65,9 @@ from docutranslate.workflow.base import Workflow
from docutranslate.workflow.docx_workflow import DocxWorkflow, DocxWorkflowConfig
from docutranslate.workflow.epub_workflow import EpubWorkflow, EpubWorkflowConfig
from docutranslate.workflow.html_workflow import HtmlWorkflow, HtmlWorkflowConfig
+# --- 新增的 Import ---
+from docutranslate.workflow.pptx_workflow import PPTXWorkflow, PPTXWorkflowConfig
+# ----------------------
from docutranslate.workflow.interfaces import DocxExportable, EpubExportable
from docutranslate.workflow.interfaces import (
HTMLExportable,
@@ -75,6 +78,7 @@ from docutranslate.workflow.interfaces import (
SrtExportable,
CsvExportable,
AssExportable,
+ PPTXExportable, # Added PPTXExportable
)
from docutranslate.workflow.json_workflow import JsonWorkflow, JsonWorkflowConfig
from docutranslate.workflow.md_based_workflow import (
@@ -88,9 +92,7 @@ from docutranslate.workflow.xlsx_workflow import XlsxWorkflow, XlsxWorkflowConfi
if DOCLING_EXIST or TYPE_CHECKING:
from docutranslate.converter.x2md.converter_docling import ConverterDoclingConfig
from docutranslate.converter.x2md.converter_mineru import ConverterMineruConfig
-# --- 新增的 Import ---
from docutranslate.converter.x2md.converter_mineru_deploy import ConverterMineruDeployConfig
-# ----------------------
from docutranslate.exporter.md.md2html_exporter import MD2HTMLExporterConfig
from docutranslate.exporter.txt.txt2html_exporter import TXT2HTMLExporterConfig
from docutranslate.translator.ai_translator.md_translator import MDTranslatorConfig
@@ -108,8 +110,8 @@ from docutranslate.exporter.epub.epub2html_exporter import Epub2HTMLExporterConf
from docutranslate.translator.ai_translator.html_translator import HtmlTranslatorConfig
from docutranslate.translator.ai_translator.ass_translator import AssTranslatorConfig
from docutranslate.exporter.ass.ass2html_exporter import Ass2HTMLExporterConfig
-
-# ------------------------------------
+from docutranslate.translator.ai_translator.pptx_translator import PPTXTranslatorConfig
+from docutranslate.exporter.pptx.pptx2html_exporter import PPTX2HTMLExporterConfig
from docutranslate.logger import global_logger
from docutranslate.translator import default_params
@@ -133,6 +135,7 @@ WORKFLOW_DICT: Dict[str, Type[Workflow]] = {
"epub": EpubWorkflow,
"html": HtmlWorkflow,
"ass": AssWorkflow,
+ "pptx": PPTXWorkflow, # Added PPTXWorkflow
}
# --- 媒体类型映射 ---
@@ -148,6 +151,7 @@ MEDIA_TYPES = {
"srt": "text/plain; charset=utf-8",
"epub": "application/epub+zip",
"ass": "text/plain; charset=utf-8",
+ "pptx": "application/vnd.openxmlformats-officedocument.presentationml.presentation", # Added PPTX MIME
}
@@ -609,6 +613,25 @@ class AssWorkflowParams(BaseWorkflowParams):
# --- ASS WORKFLOW PARAMS END ---
+# --- PPTX WORKFLOW PARAMS START ---
+class PPTXWorkflowParams(BaseWorkflowParams):
+ workflow_type: Literal["pptx"] = Field(
+ ..., description="指定使用PPTX的翻译工作流。"
+ )
+ insert_mode: Literal["replace", "append", "prepend"] = Field(
+ "replace",
+ description="翻译文本的插入模式。'replace':替换原文,'append':附加到原文后,'prepend':附加到原文前。",
+ )
+ separator: str = Field(
+ "\n",
+ description="当 insert_mode 为 'append' 或 'prepend' 时,用于分隔原文和译文的分隔符。",
+ )
+ # target_cjk_font removed as per request
+
+
+# --- PPTX WORKFLOW PARAMS END ---
+
+
# 3. 使用可辨识联合类型(Discriminated Union)将它们组合起来
TranslatePayload = Annotated[
Union[
@@ -621,6 +644,7 @@ TranslatePayload = Annotated[
EpubWorkflowParams,
HtmlWorkflowParams,
AssWorkflowParams,
+ PPTXWorkflowParams,
],
Field(discriminator="workflow_type"),
]
@@ -639,6 +663,7 @@ class TranslateServiceRequest(BaseModel):
"my_book.epub",
"index.html",
"dialogue.ass",
+ "presentation.pptx",
],
)
file_content: str = Field(
@@ -864,6 +889,26 @@ class TranslateServiceRequest(BaseModel):
"retry": default_params["retry"],
},
},
+ {
+ "file_name": "presentation.pptx",
+ "file_content": "UEsDBBQAAAAIA... (base64-encoded pptx)",
+ "payload": {
+ "workflow_type": "pptx",
+ "skip_translate": False,
+ "base_url": "https://api.openai.com/v1",
+ "api_key": "sk-your-api-key-here",
+ "model_id": "gpt-4o",
+ "to_lang": "中文",
+ "insert_mode": "replace",
+ "separator": "\n",
+ "chunk_size": default_params["chunk_size"],
+ "concurrent": default_params["concurrent"],
+ "temperature": default_params["temperature"],
+ "timeout": default_params["timeout"],
+ "thinking": "default",
+ "retry": default_params["retry"],
+ },
+ },
]
}
)
@@ -1283,6 +1328,46 @@ async def _perform_translation(
workflow = AssWorkflow(config=workflow_config)
# --- ASS WORKFLOW LOGIC END ---
+ # --- PPTX WORKFLOW LOGIC START ---
+ elif isinstance(payload, PPTXWorkflowParams):
+ task_logger.info("构建 PPTXWorkflow 配置。")
+ translator_args = payload.model_dump(
+ include={
+ "skip_translate",
+ "base_url",
+ "api_key",
+ "model_id",
+ "to_lang",
+ "custom_prompt",
+ "temperature",
+ "thinking",
+ "chunk_size",
+ "concurrent",
+ "insert_mode",
+ "separator",
+ "glossary_dict",
+ "timeout",
+ "retry",
+ "system_proxy_enable",
+ "force_json",
+ },
+ exclude_none=True,
+ )
+ translator_args["glossary_generate_enable"] = (
+ payload.glossary_generate_enable
+ )
+ translator_args["glossary_agent_config"] = build_glossary_agent_config()
+ translator_config = PPTXTranslatorConfig(**translator_args)
+
+ html_exporter_config = PPTX2HTMLExporterConfig(cdn=True)
+ workflow_config = PPTXWorkflowConfig(
+ translator_config=translator_config,
+ html_exporter_config=html_exporter_config,
+ logger=task_logger,
+ )
+ workflow = PPTXWorkflow(config=workflow_config)
+ # --- PPTX WORKFLOW LOGIC END ---
+
else:
raise TypeError(f"工作流类型 '{payload.workflow_type}' 的处理逻辑未实现。")
@@ -1313,30 +1398,7 @@ async def _perform_translation(
# 定义导出函数映射
export_map = {}
- # 根据 workflow 的类型填充导出映射
- if isinstance(workflow, HTMLExportable):
- html_config = None
- if isinstance(workflow, MarkdownBasedWorkflow):
- html_config = MD2HTMLExporterConfig(cdn=is_cdn_available)
- elif isinstance(workflow, TXTWorkflow):
- html_config = TXT2HTMLExporterConfig(cdn=is_cdn_available)
- elif isinstance(workflow, JsonWorkflow):
- html_config = Json2HTMLExporterConfig(cdn=is_cdn_available)
- elif isinstance(workflow, XlsxWorkflow):
- html_config = Xlsx2HTMLExporterConfig(cdn=is_cdn_available)
- elif isinstance(workflow, DocxWorkflow):
- html_config = Docx2HTMLExporterConfig(cdn=is_cdn_available)
- elif isinstance(workflow, SrtWorkflow):
- html_config = Srt2HTMLExporterConfig(cdn=is_cdn_available)
- elif isinstance(workflow, EpubWorkflow):
- html_config = Epub2HTMLExporterConfig(cdn=is_cdn_available)
- elif isinstance(workflow, AssWorkflow):
- html_config = Ass2HTMLExporterConfig(cdn=is_cdn_available)
- export_map["html"] = (
- lambda: workflow.export_to_html(html_config),
- f"{filename_stem}_translated.html",
- True,
- )
+
if isinstance(workflow, MDFormatsExportable):
export_map["markdown"] = (
workflow.export_to_markdown,
@@ -1396,6 +1458,39 @@ async def _perform_translation(
f"{filename_stem}_translated.ass",
True,
)
+ if isinstance(workflow, PPTXExportable):
+ export_map["pptx"] = (
+ workflow.export_to_pptx,
+ f"{filename_stem}_translated.pptx",
+ False,
+ )
+
+ # 根据 workflow 的类型填充导出映射
+ if isinstance(workflow, HTMLExportable):
+ html_config = None
+ if isinstance(workflow, MarkdownBasedWorkflow):
+ html_config = MD2HTMLExporterConfig(cdn=is_cdn_available)
+ elif isinstance(workflow, TXTWorkflow):
+ html_config = TXT2HTMLExporterConfig(cdn=is_cdn_available)
+ elif isinstance(workflow, JsonWorkflow):
+ html_config = Json2HTMLExporterConfig(cdn=is_cdn_available)
+ elif isinstance(workflow, XlsxWorkflow):
+ html_config = Xlsx2HTMLExporterConfig(cdn=is_cdn_available)
+ elif isinstance(workflow, DocxWorkflow):
+ html_config = Docx2HTMLExporterConfig(cdn=is_cdn_available)
+ elif isinstance(workflow, SrtWorkflow):
+ html_config = Srt2HTMLExporterConfig(cdn=is_cdn_available)
+ elif isinstance(workflow, EpubWorkflow):
+ html_config = Epub2HTMLExporterConfig(cdn=is_cdn_available)
+ elif isinstance(workflow, AssWorkflow):
+ html_config = Ass2HTMLExporterConfig(cdn=is_cdn_available)
+ elif isinstance(workflow, PPTXWorkflow):
+ html_config = PPTX2HTMLExporterConfig(cdn=is_cdn_available)
+ export_map["html"] = (
+ lambda: workflow.export_to_html(html_config),
+ f"{filename_stem}_translated.html",
+ True,
+ )
# 循环生成文件
for file_type, (export_func, filename, is_string_output) in export_map.items():
@@ -1616,7 +1711,7 @@ def _cancel_translation_logic(task_id: str):
description="""
接收一个包含文件内容(Base64编码)和工作流参数的JSON请求,启动一个后台翻译任务。
-- **工作流选择**: 请求体中的 `payload.workflow_type` 字段决定了本次任务的类型(如 `markdown_based`, `txt`, `json`, `xlsx`, `docx`, `srt`, `epub`, `html`, `ass`)。
+- **工作流选择**: 请求体中的 `payload.workflow_type` 字段决定了本次任务的类型(如 `markdown_based`, `txt`, `json`, `xlsx`, `docx`, `srt`, `epub`, `html`, `ass`, `pptx`)。
- **动态参数**: 根据所选工作流,API需要不同的参数集。请参考下面的Schema或示例。
- **异步处理**: 此端点会立即返回任务ID,客户端需轮询状态接口获取进度。
""",
@@ -1960,6 +2055,27 @@ async def service_release_task(task_id: str):
},
},
# --- ASS STATUS EXAMPLE END ---
+ # --- PPTX STATUS EXAMPLE START ---
+ "completed_pptx": {
+ "summary": "已完成 (PPTX)",
+ "value": {
+ "task_id": "a1b2c3d6",
+ "is_processing": False,
+ "status_message": "翻译成功!用时 30.50 秒。",
+ "error_flag": False,
+ "download_ready": True,
+ "original_filename_stem": "presentation",
+ "original_filename": "presentation.pptx",
+ "task_start_time": 1678890300.0,
+ "task_end_time": 1678890330.50,
+ "downloads": {
+ "pptx": "/service/download/a1b2c3d6/pptx",
+ "html": "/service/download/a1b2c3d6/html",
+ },
+ "attachment": {},
+ },
+ },
+ # --- PPTX STATUS EXAMPLE END ---
"error": {
"summary": "失败",
"value": {
@@ -2052,6 +2168,7 @@ FileType = Literal[
"srt",
"epub",
"ass",
+ "pptx",
]
@@ -2077,6 +2194,9 @@ FileType = Literal[
"application/epub+zip": {
"schema": {"type": "string", "format": "binary"}
},
+ "application/vnd.openxmlformats-officedocument.presentationml.presentation": {
+ "schema": {"type": "string", "format": "binary"}
+ },
},
},
404: {
@@ -2092,7 +2212,7 @@ async def service_download_file(
file_type: FileType = FastApiPath(
...,
description="要下载的文件类型。",
- examples=["html", "json", "csv", "docx", "srt", "epub", "ass"],
+ examples=["html", "json", "csv", "docx", "srt", "epub", "ass", "pptx"],
),
):
task_state = tasks_state.get(task_id)
@@ -2198,6 +2318,14 @@ async def service_download_attachment(
"content": "UEsDBBQAAAAIA... (base64-encoded string)",
},
},
+ "pptx_base64": {
+ "summary": "PPTX 内容 (Base64)",
+ "value": {
+ "file_type": "pptx",
+ "filename": "my_presentation_translated.pptx",
+ "content": "UEsDBBQAAAAIA... (base64-encoded string)",
+ },
+ },
}
}
},
@@ -2215,7 +2343,7 @@ async def service_content(
file_type: FileType = FastApiPath(
...,
description="要获取内容的文件类型。",
- examples=["html", "json", "csv", "docx", "srt", "epub", "ass"],
+ examples=["html", "json", "csv", "docx", "srt", "epub", "ass", "pptx"],
),
):
task_state = tasks_state.get(task_id)
diff --git a/docutranslate/static/i18nData.json b/docutranslate/static/i18nData.json
index c045479..4e1ee00 100644
--- a/docutranslate/static/i18nData.json
+++ b/docutranslate/static/i18nData.json
@@ -13,6 +13,7 @@
"workflowOptionAss": "ASS字幕翻译 (.ass)",
"workflowOptionJson": "JSON翻译 (.json)",
"workflowOptionHtml": "HTML翻译 (.html)",
+ "workflowOptionPptx": "PPTX演示文稿 (.pptx)",
"autoWorkflowLabel": "自动选择工作流",
"txtSettingsTitleText": "TXT翻译选项",
"insertModeLabel": "插入模式",
@@ -48,6 +49,8 @@
"insertModeHelpAss": "选择如何将翻译后的文本插入。",
"separatorPlaceholderAss": "例如: \\N (换行符)",
"separatorHelpAss": "当插入模式为附加或前置时,用于分隔原文和译文的字符。\\N 是ASS格式的换行符。",
+ "pptxSettingsTitleText": "PPTX翻译选项",
+ "insertModeHelpPptx": "选择如何将翻译后的文本插入文本框。",
"jsonSettingsTitleText": "JSON路径配置",
"jsonPathLabel": "需要翻译的JSON路径",
"jsonPathPlaceholder": "每行一个路径, 例如:\n$.name\n$.*",
@@ -55,7 +58,6 @@
"parsingSettingsTitleText": "解析配置",
"parsingEngineLabel": "解析引擎",
"parsingEngineHelp": "如果上传的文件本身是.md格式,此项可不选。",
- "getMineruTokenTitle": "获取Mineru Token",
"mineruTokenPlaceholder": "使用Mineru引擎时需要",
"modelVersionLabel": "Mineru 模型版本",
"modelVersionVlm": "VLM",
@@ -80,7 +82,6 @@
"platformCustom": "自定义接口",
"baseUrlLabel": "API 地址 (Base URL)",
"baseUrlPlaceholder": "OpenAi兼容地址",
- "getApiKeyTitle": "获取API Key",
"apiKeyPlaceholder": "请输入您的API Key",
"modelIdLabel": "模型ID",
"modelIdPlaceholder": "例如: gpt-4o, glm-4",
@@ -115,8 +116,6 @@
"glossaryGenConfigCustom": "自定义",
"importConfigBtn": "导入配置",
"exportConfigBtn": "导出配置",
- "githubInfo": "GitHub主页(欢迎star❤):
\n https://github.com/xunbu/docutranslate",
- "qqGroupInfo": "交流QQ群: 1047781902",
"taskListTitle": "任务列表",
"newTaskBtn": "新建任务",
"noTaskPlaceholder": "当前没有任务,点击“新建任务”开始吧!",
@@ -144,7 +143,7 @@
"closeBtn": "关闭",
"downloadBtn": "下载",
"tutorialModalTitle": "使用教程",
- "tutorialModalBody": "
视频教程可以在B站搜索 docutranslate 获取。
欢迎使用 DocuTranslate!请按照以下步骤完成文档翻译:
在左侧配置面板的顶部,首先选择最适合您文件类型的处理流程。
.txt 纯文本文件。.epub 电子书文件。.docx Word文档。.xlsx 或 .csv 电子表格文件。.srt 字幕文件。.ass 特效字幕文件。.json 文件中的特定字段。.html 网页文件。选择工作流后,下方会显示相关的配置选项。请依次完成设置(所有配置都会自动保存在您的浏览器中):
A. 工作流特定选项 (根据您第一步的选择出现):
minerU 引擎,需要在此处填入您的Token。\\N,EPUB格式常用 <br /> 作为换行分隔符)。$.*(翻译全部字符串),$..description(翻译所有键为description的值)。B. 通用选项 (适用于所有工作流):
在右侧的任务列表中,点击或拖拽您的文档到文件上传区域。
文件选择成功后,点击任务卡片右下角的 开始翻译 按钮。系统将开始处理任务,您可以在日志区域查看实时进度。
翻译完成后,任务卡片下方会出现操作按钮:
视频教程可以在B站搜索 docutranslate 获取。
欢迎使用 DocuTranslate!请按照以下步骤完成文档翻译:
在左侧配置面板的顶部,首先选择最适合您文件类型的处理流程。
.txt 纯文本文件。.epub 电子书文件。.docx Word文档。.xlsx 或 .csv 电子表格文件。.pptx 幻灯片文件。.srt 字幕文件。.ass 特效字幕文件。.json 文件中的特定字段。.html 网页文件。选择工作流后,下方会显示相关的配置选项。请依次完成设置(所有配置都会自动保存在您的浏览器中):
A. 工作流特定选项 (根据您第一步的选择出现):
minerU 引擎,需要在此处填入您的Token。\\N,EPUB格式常用 <br /> 作为换行分隔符)。$.*(翻译全部字符串),$..description(翻译所有键为description的值)。B. 通用选项 (适用于所有工作流):
在右侧的任务列表中,点击或拖拽您的文档到文件上传区域。
文件选择成功后,点击任务卡片右下角的 开始翻译 按钮。系统将开始处理任务,您可以在日志区域查看实时进度。
翻译完成后,任务卡片下方会出现操作按钮:
\\N is the newline character for the ASS format.",
+ "pptxSettingsTitleText": "PPTX Translation Options",
+ "insertModeHelpPptx": "Choose how to insert the translated text into text boxes.",
"jsonSettingsTitleText": "JSON Path Configuration",
"jsonPathLabel": "JSON Paths to Translate",
"jsonPathPlaceholder": "One path per line, e.g.:\n$.name\n$.*",
@@ -250,7 +252,6 @@
"parsingSettingsTitleText": "Parsing Configuration",
"parsingEngineLabel": "Parsing Engine",
"parsingEngineHelp": "If the uploaded file is already in .md format, this can be skipped.",
- "getMineruTokenTitle": "Get Mineru Token",
"mineruTokenPlaceholder": "Required when using the Mineru engine",
"modelVersionLabel": "Mineru Model Version",
"modelVersionVlm": "VLM",
@@ -275,7 +276,6 @@
"platformCustom": "Custom API",
"baseUrlLabel": "API Address (Base URL)",
"baseUrlPlaceholder": "OpenAI-compatible address",
- "getApiKeyTitle": "Get API Key",
"apiKeyPlaceholder": "Please enter your API Key",
"modelIdLabel": "Model ID",
"modelIdPlaceholder": "e.g., gpt-4o, glm-4",
@@ -310,8 +310,6 @@
"glossaryGenConfigCustom": "Custom",
"importConfigBtn": "Import Config",
"exportConfigBtn": "Export Config",
- "githubInfo": "GitHub Page (stars❤ welcome): Video tutorials are available on Bilibili by searching for docutranslate.
Welcome to DocuTranslate! Please follow these steps to translate your documents:
At the top of the left-side configuration panel, first choose the processing flow that best suits your file type.
.txt plain text files..epub e-book files..docx Word documents..xlsx or .csv spreadsheet files..srt subtitle files..ass advanced subtitle files..json files..html web page files.After selecting a workflow, the relevant configuration options will appear below. Please complete the settings in order (all configurations are automatically saved in your browser):
A. Workflow-Specific Options (Appears based on your choice in Step 1):
minerU engine, you need to enter your token here.\\\\N is common for ASS format, <br /> for EPUB format as a line break).$.* (translate all strings), $..description (translate all values with the key description).B. General Options (Applicable to all workflows):
In the task list on the right, click or drag your document into the file upload area.
Once the file is successfully selected, click the Start Translation button on the bottom right of the task card. The system will begin processing the task, and you can view the real-time progress in the log area.
After the translation is complete, action buttons will appear on the task card:
Video tutorials are available on Bilibili by searching for docutranslate.
Welcome to DocuTranslate! Please follow these steps to translate your documents:
At the top of the left-side configuration panel, first choose the processing flow that best suits your file type.
.txt plain text files..epub e-book files..docx Word documents..xlsx or .csv spreadsheet files..pptx slide files..srt subtitle files..ass advanced subtitle files..json files..html web page files.After selecting a workflow, the relevant configuration options will appear below. Please complete the settings in order (all configurations are automatically saved in your browser):
A. Workflow-Specific Options (Appears based on your choice in Step 1):
minerU engine, you need to enter your token here.\\\\N is common for ASS format, <br /> for EPUB format as a line break).$.* (translate all strings), $..description (translate all values with the key description).B. General Options (Applicable to all workflows):
In the task list on the right, click or drag your document into the file upload area.
Once the file is successfully selected, click the Start Translation button on the bottom right of the task card. The system will begin processing the task, and you can view the real-time progress in the log area.
After the translation is complete, action buttons will appear on the task card:
GitHub主页(欢迎star❤):
https://github.com/xunbu/docutranslate
交流QQ群: 1047781902
version:{{ version ? 'v' + version : '' }}
{{ t('noTaskPlaceholder') }}
{{ task.backendId || t('taskCardIdPlaceholder') }}
{{ t('taskCardFileDrop') }}
{{ t('taskCardFileSelected') }}
GitHub主页(欢迎star❤):
https://github.com/xunbu/docutranslate
交流QQ群: 1047781902
version:{{ version ? 'v' + version : '' }}
{{ t('noTaskPlaceholder') }}
{{ task.backendId || t('taskCardIdPlaceholder') }}
{{ t('taskCardFileDrop') }}
{{ t('taskCardFileSelected') }}