1 month ago · cb25eb918f
--- a/landsite_agent/config.py
+++ b/landsite_agent/config.py
@@ -16,12 +16,10 @@ model_list: Dict[str, Dict[str, Any]] = {
 
															         "api_base": "http://ac.zjugis.com:8511/v1",
														
 
															         "model_name": "qwen2.5-instruct"
														
 
															     },
														
 
															-    "azure": {
														
 
															-        "api_key": "your-azure-api-key",
														
 
															-        "api_base": "https://your-azure-endpoint.openai.azure.com",
														
 
															-        "model_name": "gpt-35-turbo",
														
 
															-        "temperature": 0,
														
 
															-        "max_tokens": 2000
														
 
															+    "zjstai": {
														
 
															+        "api_key": "none",
														
 
															+        "api_base": "http://172.27.27.20:20331/v1",
														
 
															+        "model_name": "DeepSeek-R1-Distill-Qwen-32B",
														
 
															     },
														
 
															     "local": {
														
 
															         "api_key": "your-local-api-key",
														
@@ -32,6 +30,9 @@ model_list: Dict[str, Dict[str, Any]] = {
 
															     }
														
 
															 }
														
 
															+# 新增全局默认模型类型开关
														
 
															+DEFAULT_MODEL_TYPE = "openai"
														
 
															+
														
 
															 def get_model_config(model_type: str = "openai") -> ModelConfig:
														
 
															     """
														
 
															     获取模型配置
														
--- a/landsite_agent/database.py
+++ b/landsite_agent/database.py
@@ -18,6 +18,14 @@ db_list: dict[str, dict[Any, Any] | dict[str, str]] = {
 
															     }
														
 
															 }
														
 
															+# 向量模型配置
														
 
															+vector_model_config: dict[str, dict[str, str]] = {
														
 
															+    "m3e-base": {
														
 
															+        "model_path": r"E:\项目临时\AI大模型\m3e-base",
														
 
															+        "device": "cpu"
														
 
															+    },
														
 
															+    # 可扩展其他向量模型
														
 
															+}
														
 
															 class Database:
														
 
															     def __init__(self, db_type: str = "pg"):
														
--- a/landsite_agent/examples.json
+++ b/landsite_agent/examples.json
@@ -28,5 +28,10 @@
 
															     "query_type": "land_site_selection",
														
 
															     "query": "帮我在温州南站附近推荐几块50亩左右的工业用地,温州南站的坐标为120.58,27.97,数据表是控制性详细规划",
														
 
															     "sql_code": "select t.id from (select id,ydmj,round(st_distance(st_geometryfromtext('POINT (120.58 27.97)', 4490)::geography,shape::geography)::numeric,0) as distance from sde.kzxxxgh where ydxz like '%工业%'  and shape is not null and abs(ydmj - 50*0.0667) <= 1) as t where t.distance <= 10000  order by t.ydmj nulls last limit 5"
														
 
															+  },
														
 
															+  {
														
 
															+    "query_type": "land_site_selection",
														
 
															+    "query": "请在萧山区找出面积最大的商业用地,数据表是控制性详细规划",
														
 
															+    "sql_code": "SELECT id FROM sde.kzxxxgh WHERE xzqmc = '萧山区' AND ydxz LIKE '%商业%' AND shape IS NOT NULL ORDER BY ydmj DESC LIMIT 1;"
														
 
															   }
														
 
															 ] 
														
--- a/landsite_agent/main.py
+++ b/landsite_agent/main.py
@@ -1,16 +1,15 @@
 
															 from fastapi import FastAPI, HTTPException
														
 
															 from fastapi.middleware.cors import CORSMiddleware
														
 
															 from pydantic import BaseModel
														
 
															-import pandas as pd
														
 
															-import plotly.express as px
														
 
															 import json
														
 
															 from fastapi.responses import StreamingResponse
														
 
															 from typing import AsyncGenerator, List, Dict, Any
														
 
															 import uvicorn
														
 
															 import traceback
														
 
															-import asyncio
														
 
															 from xuanzhi_query import router as xz_router
														
 
															 from sql_generator import SQLGenerator
														
 
															+from config import DEFAULT_MODEL_TYPE
														
 
															+import re
														
 
															 app = FastAPI(title="Land Analysis API")
														
 
															 app.include_router(xz_router)
														
@@ -35,15 +34,18 @@ class AnalysisResult(BaseModel):
 
															     similar_examples: List[Dict[str, Any]] = None
														
 
															-sql_generator = SQLGenerator()
														
 
															-
														
 
															-
														
 
															 @app.post("/land_analysis/stream")
														
 
															 async def stream_land_analysis(request: QueryRequest):
														
 
															     """
														
 
															     流式返回土地分析结果
														
 
															     """
														
 
															+    def remove_think_tag(text: str) -> str:
														
 
															+        # 移除<think>标签及其内容
														
 
															+        return re.sub(r"<think>[\s\S]*?</think>\n*", "", text)
														
 
															+
														
 
															+    sql_generator = SQLGenerator(model_type=DEFAULT_MODEL_TYPE)
														
 
															+
														
 
															     async def generate_stream() -> AsyncGenerator[str, None]:
														
 
															         try:
														
 
															             similar_examples = None
														
@@ -56,9 +58,13 @@ async def stream_land_analysis(request: QueryRequest):
 
															                     similar_examples = data["content"]
														
 
															                     yield chunk
														
 
															                 elif data["type"] == "sql_generation":
														
 
															+                    # zjstai模型时，移除<think>标签内容
														
 
															+                    # if DEFAULT_MODEL_TYPE == "zjstai":
														
 
															+                    #     data["content"] = remove_think_tag(data["content"])
														
 
															+                    #     yield json.dumps(data, ensure_ascii=False) + "\n"
														
 
															+                    # else:
														
 
															                     yield chunk
														
 
															                 elif data["type"] == "sql_result":
														
 
															-                    # 获取到完整的SQL后执行
														
 
															                     sql = data["content"]
														
 
															                     result = await sql_generator.execute_sql(sql)
														
@@ -69,7 +75,6 @@ async def stream_land_analysis(request: QueryRequest):
 
															                         }, ensure_ascii=False) + "\n"
														
 
															                         return
														
 
															-                    # 返回最终结果
														
 
															                     yield json.dumps({
														
 
															                         "type": "result",
														
 
															                         "data": {
														
@@ -93,48 +98,13 @@ async def stream_land_analysis(request: QueryRequest):
 
															     )
														
 
															-@app.post("/land_analysis", response_model=AnalysisResult)
														
 
															-async def generate_and_execute_sql(request: QueryRequest):
														
 
															-    try:
														
 
															-        # 获取相似示例
														
 
															-        similar_examples = sql_generator._get_similar_examples(request.description)
														
 
															-
														
 
															-        # 构建增强提示词
														
 
															-        enhanced_prompt = f"""
														
 
															-        基于以下相似示例：
														
 
															-        {json.dumps(similar_examples, ensure_ascii=False, indent=2)}
														
 
															-        
														
 
															-        请根据以下描述生成SQL查询：
														
 
															-        {request.description}
														
 
															-        """
														
 
															-
														
 
															-        # 生成SQL
														
 
															-        sql = await sql_generator.chain.arun(enhanced_prompt)
														
 
															-
														
 
															-        # 执行SQL
														
 
															-        result = await sql_generator.execute_sql(sql)
														
 
															-
														
 
															-        if result["status"] == "error":
														
 
															-            raise HTTPException(status_code=400, detail=result["message"])
														
 
															-
														
 
															-        return AnalysisResult(
														
 
															-            sql=sql,
														
 
															-            exec_result=result["data"]
														
 
															-        )
														
 
															-
														
 
															-    except Exception as e:
														
 
															-        traceback.print_exc()
														
 
															-        raise HTTPException(status_code=500, detail=str(e))
														
 
															-
														
 
															-
														
 
															 @app.on_event("shutdown")
														
 
															 async def shutdown_event():
														
 
															     """
														
 
															     应用关闭时清理资源
														
 
															     """
														
 
															-    await sql_generator.close()
														
 
															+    pass
														
 
															 if __name__ == "__main__":
														
 
															     uvicorn.run(app, host="0.0.0.0", port=8521)
														
 
															-
														
--- a/landsite_agent/requirements.txt
+++ b/landsite_agent/requirements.txt
--- a/landsite_agent/sql_generator.py
+++ b/landsite_agent/sql_generator.py
@@ -1,17 +1,15 @@
 
															 from langchain_openai import ChatOpenAI
														
 
															 from langchain.prompts import ChatPromptTemplate
														
 
															 from langchain_core.output_parsers import StrOutputParser
														
 
															-from langchain_core.runnables import RunnablePassthrough
														
 
															 from langchain_core.documents import Document
														
 
															 from langchain_huggingface.embeddings.huggingface import HuggingFaceEmbeddings
														
 
															 from langchain_community.vectorstores import FAISS
														
 
															-import os
														
 
															 from prompt_template import get_prompt
														
 
															 import json
														
 
															 import traceback
														
 
															 from config import get_model_config
														
 
															 from typing import List, Dict, Any
														
 
															-from database import Database
														
 
															+from database import Database, vector_model_config
														
 
															 import re
														
 
															 class SQLGenerator:
														
@@ -42,10 +40,11 @@ class SQLGenerator:
 
															         )
														
 
															         # 初始化本地m3e-base模型
														
 
															-        self.model_path = r"E:\项目临时\AI大模型\m3e-base"
														
 
															+        model_cfg = vector_model_config["m3e-base"]
														
 
															+        self.model_path = model_cfg["model_path"]
														
 
															         self.embeddings = HuggingFaceEmbeddings(
														
 
															             model_name=self.model_path,
														
 
															-            model_kwargs={'device': 'cpu'},
														
 
															+            model_kwargs={'device': model_cfg["device"]},
														
 
															             encode_kwargs={'normalize_embeddings': True}
														
 
															         )
														
@@ -138,7 +137,7 @@ class SQLGenerator:
 
															         """
														
 
															         try:
														
 
															             # 开始生成SQL
														
 
															-            yield json.dumps({"type": "start", "message": "开始生成SQL查询..."}, ensure_ascii=False) + "\n"
														
 
															+            yield json.dumps({"type": "start", "content": "开始生成SQL查询..."}, ensure_ascii=False) + "\n"
														
 
															             # 获取相似示例
														
 
															             similar_examples = self._get_similar_examples(query_description)
														
@@ -203,19 +202,19 @@ class SQLGenerator:
 
															                         "content": full_response
														
 
															                     }, ensure_ascii=False) + "\n"
														
 
															-                yield json.dumps({"type": "end", "message": "SQL生成完成"}, ensure_ascii=False) + "\n"
														
 
															+                yield json.dumps({"type": "end", "content": "SQL生成完成"}, ensure_ascii=False) + "\n"
														
 
															             except Exception as e:
														
 
															                 print(f"Error details: {traceback.format_exc()}")
														
 
															                 yield json.dumps({
														
 
															                     "type": "error",
														
 
															-                    "message": f"生成SQL时发生错误: {str(e)}"
														
 
															+                    "content": f"生成SQL时发生错误: {str(e)}"
														
 
															                 }, ensure_ascii=False) + "\n"
														
 
															         except Exception as e:
														
 
															             traceback.print_exc()
														
 
															             yield json.dumps({
														
 
															                 "type": "error",
														
 
															-                "message": str(e)
														
 
															+                "content": str(e)
														
 
															             }, ensure_ascii=False) + "\n"
														
 
															     async def execute_sql(self, sql: str) -> dict: