1.新增视觉能力 2.新增对上次图片或上传图片引用图片做编辑能力.

2026-03-20 16:13:19 +08:00
parent 8e65682dba
commit adc7e70c1f
7 changed files with 362 additions and 205 deletions
--- a/src/server/deep_agent/tools/generate_furniture_sketch.py
+++ b/src/server/deep_agent/tools/generate_furniture_sketch.py
@@ -1,36 +1,37 @@
-import json
-import logging
-import os
 import uuid
-from pathlib import Path
-from typing import Annotated
-
 import httpx
-from google.oauth2 import service_account
-from langchain_core.tools import tool
-from google import genai
-from google.genai.types import GenerateContentConfig, Modality
-from langgraph.prebuilt import ToolRuntime
+import logging

 from minio import Minio
+from google import genai
+from pathlib import Path
+from datetime import datetime
+from langchain_core.tools import tool
+from google.oauth2 import service_account
+from langgraph.prebuilt import ToolRuntime

-from src.core.config import settings
-from src.server.utils.new_oss_client import oss_upload_image, oss_get_image, is_minio_file_exist, oss_upload_image_file
+from src.core.config import settings, MONGO_URI
+from src.server.deep_agent.utils.mongodb_util import ThreadImageMinIOStore
+
+# from google.genai.types import GenerateContentConfig, Modality
+# from langgraph.config import get_stream_writer
+# from src.server.utils.new_oss_client import oss_upload_image, oss_get_image, is_minio_file_exist, oss_upload_image_file
+
+# 初始化全局凭证和客户端
+# creds = service_account.Credentials.from_service_account_file(
+#     settings.GOOGLE_GENAI_USE_VERTEXAI,
+#     scopes=["https://www.googleapis.com/auth/cloud-platform"],
+# )
+# client = genai.Client(
+#     credentials=creds,
+#     project=settings.GOOGLE_CLOUD_PROJECT,
+#     location=settings.GOOGLE_CLOUD_LOCATION,
+#     vertexai=True
+# )

 logger = logging.getLogger(__name__)
-# 初始化全局凭证和客户端
-creds = service_account.Credentials.from_service_account_file(
-    settings.GOOGLE_GENAI_USE_VERTEXAI,
-    scopes=["https://www.googleapis.com/auth/cloud-platform"],
-)
-
 minio_client = Minio(settings.MINIO_URL, access_key=settings.MINIO_ACCESS, secret_key=settings.MINIO_SECRET, secure=settings.MINIO_SECURE)
-client = genai.Client(
-    credentials=creds,
-    project=settings.GOOGLE_CLOUD_PROJECT,
-    location=settings.GOOGLE_CLOUD_LOCATION,
-    vertexai=True
-)
+image_store = ThreadImageMinIOStore(MONGO_URI, "agent_tool_generate_db")


 def is_image_path_exist(image_path):
@@ -47,6 +48,7 @@ def create_generate_furniture_tool(workspace_dir, width: int = 1024, height: int
        使用 Gemini 图像生成模型根据详细的英文提示词生成家具设计草图。
        """
        logger.info(f"\n[系统日志] 正在调用 generate_furniture ...")
+        thread_id = runtime.config.get("configurable").get("thread_id")
        try:
            # 1. 生成图像 - local flux2-klein
            object_name = f"furniture/sketches/{uuid.uuid4()}.png"
@@ -67,15 +69,7 @@ def create_generate_furniture_tool(workspace_dir, width: int = 1024, height: int
            image_url = result.get("output_path", None)

            if image_url:
-                filename = os.path.join(workspace_dir, image_url)
-                # 2. 创建本地目录（确保目录存在）
-                local_dir = os.path.dirname(filename)
-                if not os.path.exists(local_dir):
-                    os.makedirs(local_dir, exist_ok=True)
-
-                img = oss_get_image(oss_client=minio_client, bucket=image_url.split('/')[0], object_name=image_url[image_url.find('/') + 1:])
-                img.save(filename)
-
+                image_store.save_image_path(thread_id=thread_id, object_path=image_url, metadata={"prompt": prompt, "generated_at": str(datetime.now())})
                return image_url
            else:
                return f"Image generation failed."
@@ -89,65 +83,42 @@ def create_generate_furniture_tool(workspace_dir, width: int = 1024, height: int

 def create_edit_furniture_tool(workspace_dir, width: int = 1024, height: int = 1024):
    @tool
-    async def edit_furniture(prompt: str, input_image_path) -> str:
+    async def edit_furniture(prompt: str, runtime: ToolRuntime) -> str:
        """
        使用图像生成模型根据详细的英文提示词编辑家具设计草图。
        """
        logger.info(f"\n[系统日志] 正在调用 edit_furniture ...")
-
+        thread_id = runtime.config.get("configurable").get("thread_id")
        try:
-            # 0. 编辑前先检查工作环境和minio上是否存在该图像
-            input_image_path = input_image_path.lstrip('/')
-            filename = os.path.join(workspace_dir, input_image_path)
-            local_exist = is_image_path_exist(filename)
-            minio_exist = is_minio_file_exist(minio_client=minio_client, bucket_name=input_image_path.split('/')[0], object_name=input_image_path.split('/')[0])
+            current_image_path = image_store.get_image_path(thread_id).get("current_image_path", False)
+            input_image_path = runtime.state.get("files").get("input_image", False)
+            if input_image_path or current_image_path:
+                input_path = [path for path in (input_image_path, current_image_path) if path]
+                object_name = f"furniture/sketches/{uuid.uuid4()}.png"
+                bucket_name = "fida-test"  # 替换为你的 bucket 名称
+                request_data = {
+                    "input_image_paths": input_path,
+                    "prompt": prompt,
+                    "bucket_name": bucket_name,
+                    "object_name": object_name,
+                    "width": width,
+                    "height": height
+                }
+                async with httpx.AsyncClient(timeout=120) as client:
+                    resp = await client.post(
+                        f"http://{settings.FLUX2_GEN_IMG_MODEL_URL}/predict",
+                        json=request_data,
+                    )
+                result = resp.json()
+                image_url = result.get("output_path", None)

-            if not local_exist and not minio_exist:
-                # 两个地方都不存在 直接报错
-                return f"Image generation failed."
-            elif local_exist and not minio_exist:
-                # 把本地的上传到minio
-                oss_upload_image_file(oss_client=minio_client, bucket=input_image_path.split('/')[0], object_name=input_image_path.split('/')[0], file_path=filename)
-            elif not local_exist and minio_exist:
-                # minio的下载到本地
-                img = oss_get_image(oss_client=minio_client, bucket=input_image_path.split('/')[0], object_name=input_image_path.split('/')[0], )
-                img.save(filename)
-            elif minio_exist and local_exist:
-                # 两个地方都存在 直接跳过
-                pass
-
-            # 1. 生成图像 - local flux2-klein
-            object_name = f"furniture/sketches/{uuid.uuid4()}.png"
-            bucket_name = "fida-test"  # 替换为你的 bucket 名称
-            request_data = {
-                "input_image_paths": [input_image_path],
-                "prompt": prompt,
-                "bucket_name": bucket_name,
-                "object_name": object_name,
-                "width": width,
-                "height": height
-            }
-            async with httpx.AsyncClient(timeout=120) as client:
-                resp = await client.post(
-                    f"http://{settings.FLUX2_GEN_IMG_MODEL_URL}/predict",
-                    json=request_data,
-                )
-            result = resp.json()
-            image_url = result.get("output_path", None)
-
-            if image_url:
-                filename = os.path.join(workspace_dir, image_url)
-                # 2. 创建本地目录（确保目录存在）
-                local_dir = os.path.dirname(filename)
-                if not os.path.exists(local_dir):
-                    os.makedirs(local_dir, exist_ok=True)
-
-                img = oss_get_image(oss_client=minio_client, bucket=image_url.split('/')[0], object_name=image_url[image_url.find('/') + 1:])
-                img.save(filename)
-                return image_url
+                if image_url:
+                    image_store.save_image_path(thread_id=thread_id, object_path=image_url, metadata={"prompt": prompt, "generated_at": str(datetime.now())})
+                    return image_url
+                else:
+                    return f"Image generation failed."
            else:
-                return f"Image generation failed."
-
+                return f"The picture to be edited does not exist."
        except Exception as e:
            logger.warning(f"edit_furniture error ：{e}")
            return "edit_furniture error"