From 37e2866a3fbce9a280be61e667b1251a8b17361b Mon Sep 17 00:00:00 2001 From: xunbu Date: Fri, 22 Aug 2025 10:22:32 +0800 Subject: [PATCH] =?UTF-8?q?=E5=A2=9E=E5=A4=A7mineru=E5=B9=B6=E5=8F=91?= =?UTF-8?q?=E6=95=B0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- docutranslate/converter/x2md/converter_mineru.py | 12 +++++++----- 1 file changed, 7 insertions(+), 5 deletions(-) diff --git a/docutranslate/converter/x2md/converter_mineru.py b/docutranslate/converter/x2md/converter_mineru.py index 8e5cf3b..43db090 100644 --- a/docutranslate/converter/x2md/converter_mineru.py +++ b/docutranslate/converter/x2md/converter_mineru.py @@ -21,7 +21,7 @@ class ConverterMineruConfig(X2MarkdownConverterConfig): model_version: Literal["pipeline", "vlm"] = "vlm" def gethash(self) -> Hashable: - return self.formula_ocr,self.model_version + return self.formula_ocr, self.model_version timeout = httpx.Timeout( @@ -36,8 +36,10 @@ timeout = httpx.Timeout( # else: # client = httpx.Client(trust_env=False, timeout=timeout, proxy=None, verify=False) # client_async = httpx.AsyncClient(trust_env=False, timeout=timeout, proxy=None, verify=False) -client = httpx.Client(trust_env=False, timeout=timeout, proxy=None, verify=False) -client_async = httpx.AsyncClient(trust_env=False, timeout=timeout, proxy=None, verify=False) + +limits = httpx.Limits(max_connections=500, max_keepalive_connections=20) +client = httpx.Client(limits=limits, trust_env=False, timeout=timeout, proxy=None, verify=False) +client_async = httpx.AsyncClient(limits=limits, trust_env=False, timeout=timeout, proxy=None, verify=False) class ConverterMineru(X2MarkdownConverter): @@ -45,7 +47,7 @@ class ConverterMineru(X2MarkdownConverter): super().__init__(config=config) self.mineru_token = config.mineru_token.strip() self.formula = config.formula_ocr - self.model_version=config.model_version + self.model_version = config.model_version def _get_header(self): return { @@ -58,7 +60,7 @@ class ConverterMineru(X2MarkdownConverter): "enable_formula": self.formula, "language": "auto", "enable_table": True, - "model_version":self.model_version, + "model_version": self.model_version, "files": [ {"name": f"{document.name}", "is_ocr": True} ]