110 lines
4.1 KiB
Python
110 lines
4.1 KiB
Python
import asyncio
|
||
|
||
import httpx
|
||
|
||
|
||
class Agent:
|
||
def __init__(self, baseurl="", key="", model_id="", system_prompt="", temperature=0.7, max_concurrent=5):
|
||
self.baseurl = baseurl
|
||
self.key = key
|
||
self.model_id = model_id
|
||
self.system_prompt = system_prompt
|
||
self.temperature = temperature
|
||
# self.client=httpx.Client()
|
||
self.client_async = httpx.AsyncClient()
|
||
self.max_concurrent = max_concurrent
|
||
|
||
def _prepare_request_data(self, prompt, system_prompt, temperature=None, top_p=0.9):
|
||
if temperature is None:
|
||
temperature = self.temperature
|
||
headers = {"Content-Type": "application/json",
|
||
"Authorization": f"Bearer {self.key}"}
|
||
data = {
|
||
"model": self.model_id,
|
||
"messages": [
|
||
{"role": "system", "content": system_prompt},
|
||
{"role": "user", "content": prompt}
|
||
],
|
||
"temperature": temperature,
|
||
"top_p": top_p
|
||
}
|
||
return headers, data
|
||
|
||
# def send_prompt(self,prompt,system_prompt=None,timeout=50):
|
||
# if system_prompt is None:
|
||
# system_prompt=self.system_prompt
|
||
# headers,data=self._prepare_request_data(prompt,system_prompt)
|
||
# response=self.client.post(f"{self.baseurl}/chat/completions",json=data,headers=headers,timeout=timeout)
|
||
# response.raise_for_status()
|
||
# return response.json()["choices"][0]["message"]["content"].lstrip()
|
||
|
||
async def send_async(self, prompt: str, system_prompt: None | str = None, timeout: int = 200) -> str:
|
||
if system_prompt is None:
|
||
system_prompt = self.system_prompt
|
||
"""Sends a single prompt asynchronously."""
|
||
headers, data = self._prepare_request_data(prompt, system_prompt)
|
||
try:
|
||
response = await self.client_async.post(
|
||
f"{self.baseurl}/chat/completions",
|
||
json=data,
|
||
headers=headers,
|
||
timeout=timeout
|
||
)
|
||
response.raise_for_status()
|
||
result: str = response.json()["choices"][0]["message"]["content"]
|
||
return result.lstrip()
|
||
except httpx.HTTPStatusError as e:
|
||
raise Exception(f"AI请求错误 (async): {e.response.status_code} - {e.response.text}") from e
|
||
except httpx.RequestError as e:
|
||
raise Exception(f"AI请求连接错误 (async): {e}") from e
|
||
except (KeyError, IndexError) as e:
|
||
raise Exception(f"AI响应格式错误 (async): {e}") from e
|
||
|
||
async def send_prompts_async(
|
||
self,
|
||
prompts: list[str],
|
||
system_prompt: str | None = None,
|
||
timeout: int = 50,
|
||
max_concurrent: int = 5 # 新增参数,默认并发数为5
|
||
) -> list[str]:
|
||
total = len(prompts)
|
||
count = 0
|
||
"""
|
||
Sends multiple prompts asynchronously, limiting concurrent requests.
|
||
"""
|
||
semaphore = asyncio.Semaphore(max_concurrent)
|
||
tasks = []
|
||
|
||
# 辅助协程,用于包装 self.send_async 并使用信号量
|
||
async def send_with_semaphore(p_text: str):
|
||
async with semaphore: # 在进入代码块前获取信号量,退出时释放
|
||
result = await self.send_async(
|
||
prompt=p_text,
|
||
system_prompt=system_prompt,
|
||
timeout=timeout
|
||
)
|
||
nonlocal count
|
||
count += 1
|
||
print(f"进行到{count}/{total}")
|
||
return result
|
||
|
||
for p_text in prompts:
|
||
task = asyncio.create_task(send_with_semaphore(p_text))
|
||
tasks.append(task)
|
||
|
||
results = await asyncio.gather(*tasks, return_exceptions=False)
|
||
return results
|
||
|
||
def send_prompts(
|
||
self,
|
||
prompts: list[str],
|
||
system_prompt: str | None = None,
|
||
timeout: int = 50,
|
||
) -> list[str]:
|
||
result = asyncio.run(self.send_prompts_async(prompts, system_prompt, timeout, self.max_concurrent))
|
||
return result
|
||
|
||
|
||
if __name__ == '__main__':
|
||
pass
|