增加微信聊天中图片获取能力,较之前的微信图片仅提供缩略图的情况,改善为获取微信聊天中实际图片大小,方便后续 ocr 或者 llm vision 识别聊天图片内容。

This commit is contained in:
Ethan
2025-02-24 20:17:15 +08:00
parent f75ac292db
commit c86602ebaf
2 changed files with 20 additions and 9 deletions

View File

@@ -87,7 +87,9 @@ class GewechatMessageConverter(adapter.MessageConverter):
base64_str, image_format = await image.get_gewechat_image_base64(
gewechat_url=self.config["gewechat_url"],
app_id=self.config["app_id"],
xml_content=image_xml
xml_content=image_xml,
token=self.config["token"],
image_type=2
)
return platform_message.MessageChain([

View File

@@ -9,14 +9,20 @@ import PIL.Image
import httpx
async def get_gewechat_image_base64(gewechat_url: str, app_id: str, xml_content: str, image_type: int = 2) -> \
typing.Tuple[str, str]:
async def get_gewechat_image_base64(
gewechat_url: str,
app_id: str,
xml_content: str,
token: str,
image_type: int = 2
) -> typing.Tuple[str, str]:
"""从gewechat服务器获取图片并转换为base64格式
Args:
gewechat_url (str): gewechat服务器地址
app_id (str): gewechat应用ID
xml_content (str): 图片的XML内容
token (str): Gewechat API Token
image_type (int, optional): 图片类型. Defaults to 2.
1: 高清图片
2: 常规图片
@@ -24,16 +30,19 @@ typing.Tuple[str, str]:
Returns:
typing.Tuple[str, str]: (base64编码, 图片格式)
Raises:
Exception: 当图片下载或处理失败时抛出异常
"""
headers = {
'X-GEWE-TOKEN': token,
'Content-Type': 'application/json'
}
async with aiohttp.ClientSession() as session:
# 获取图片下载链接
async with session.post(
f"{gewechat_url}/v2/api/message/downloadImage",
headers=headers,
json={
"app_id": app_id,
"appId": app_id,
"type": image_type,
"xml": xml_content
}
@@ -48,13 +57,13 @@ typing.Tuple[str, str]:
image_url = f"{gewechat_url}{resp_data['data']['fileUrl']}"
# 下载图片内容
async with session.get(image_url) as img_response:
async with session.get(image_url, headers=headers) as img_response:
if img_response.status != 200:
raise Exception(f"下载gewechat图片失败: {await img_response.text()}")
# 获取图片格式
content_type = img_response.headers.get('Content-Type', '')
image_format = content_type.split('/')[-1] # 例如 'image/jpeg' -> 'jpeg'
image_format = content_type.split('/')[-1]
# 读取图片数据并转换为base64
image_data = await img_response.read()