智能体加检测

2025-12-02 17:16:26 +08:00
commit 61c3f26946
15 changed files with 1137 additions and 0 deletions
--- a/.idea/.gitignore
+++ b/.idea/.gitignore
@ -0,0 +1,8 @@
+# 默认忽略的文件
+/shelf/
+/workspace.xml
+# 基于编辑器的 HTTP 客户端请求
+/httpRequests/
+# Datasource local storage ignored files
+/dataSources/
+/dataSources.local.xml
--- a/AI_Agent.py
+++ b/AI_Agent.py
@ -0,0 +1,329 @@
+import os
+import re
+import time
+import subprocess
+from pathlib import Path
+from typing import List, Dict
+from docx import Document
+from shutil import which
+import requests
+
+INPUT_WORD = r"C:\Users\YC\Desktop\1.docx"  # Tender document (.docx) to read
+OUTPUT_WORD = r"C:\Users\YC\Desktop\投标文件-最终版.docx"  # Path of the generated bid document
+OLLAMA_MODEL = "alibayram/Qwen3-30B-A3B-Instruct-2507:latest"  # Model tag requested from the Ollama server
+OLLAMA_BASE_URL = "http://192.168.110.5:11434"  # Base URL of the Ollama HTTP API
+
+
+
+# ==================== Ollama 本地调用（支持 128K 上下文 + 长输出）===================
+# ==================== 终极稳版 call_llm（彻底解决超时 + 支持所有参数）===================
+def call_llm(messages: List[Dict], temperature=0.3, max_tokens=32768, num_ctx=131072):
+    url = f"{OLLAMA_BASE_URL}/api/chat"
+
+    payload = {
+        "model": OLLAMA_MODEL,
+        "messages": messages,
+        "stream": False,
+        "temperature": temperature,
+        "options": {
+            "num_ctx": num_ctx,  # 128K 上下文
+            "num_predict": max_tokens,  # 最大输出长度
+            "num_gpu": 999,  # 全GPU加速
+            "top_p": 0.95,
+            "top_k": 40,
+            "repeat_penalty": 1.08,
+            "mirostat": 2,
+            "mirostat_tau": 5.0
+        }
+    }
+
+    headers = {"Content-Type": "application/json"}
+
+    # 最多重试 6 次，指数退避
+    for attempt in range(6):
+        try:
+            print(f"   → 正在调用模型（第{attempt + 1}次尝试，最大等待15分钟）...")
+            response = requests.post(
+                url,
+                json=payload,
+                headers=headers,
+                timeout=900  # 关键！15分钟超时，足够生成目录了
+            )
+            response.raise_for_status()
+            data = response.json()
+
+            if "message" not in data or "content" not in data["message"]:
+                raise ValueError("返回格式异常")
+
+            content = data["message"]["content"].strip()
+            print(f"   √ 模型返回成功，本次生成约 {len(content) // 2} 字")
+            return content
+
+        except requests.exceptions.Timeout:
+            print(f"   × 第{attempt + 1}次超时（15分钟未返回），10秒后重试...")
+            time.sleep(10)
+        except requests.exceptions.RequestException as e:
+            print(f"   × 第{attempt + 1}次网络错误：{e}，10秒后重试...")
+            time.sleep(10)
+        except Exception as e:
+            print(f"   × 未知错误：{e}")
+            time.sleep(5)
+
+    print("   × 模型彻底失联，返回保底内容")
+    return "【模型响应失败，已启用保底方案】"
+
+
+# ==================== Word → Markdown（不变，超稳）===================
+def word_to_md(word_path: str) -> str:
+    md_path = os.path.splitext(word_path)[0] + "_tender.md"
+    print(f"正在转换招标文件 → Markdown：{os.path.basename(word_path)}")
+
+    pandoc_cmd = which("pandoc") or which("pandoc.exe")
+    if not pandoc_cmd:
+        common = [
+            os.path.expanduser(r"~\AppData\Local\Pandoc\pandoc.exe"),
+            r"C:\Program Files\Pandoc\pandoc.exe",
+        ]
+        for p in common:
+            if os.path.exists(p):
+                pandoc_cmd = p
+                break
+
+    if pandoc_cmd:
+        result = subprocess.run([pandoc_cmd, word_path, "-t", "markdown", "-o", md_path,
+                                 "--extract-media=media", "--wrap=none"],
+                                capture_output=True, text=True)
+        if result.returncode == 0:
+            print("Pandoc 转换成功！")
+            return md_path
+
+    print("Pandoc 未找到，使用 python-docx 兜底...")
+    doc = Document(word_path)
+    text = "\n\n".join(p.text for p in doc.paragraphs if p.text.strip())
+    Path(md_path).write_text(text, encoding="utf-8")
+    print("纯文本提取完成！")
+    return md_path
+
+
+# ==================== 生成超详细四级目录（利用 128K 上下文）===================
+# ==================== 生成超详细四级目录（已修复语法 + 增强稳定性）===================
+# ==================== 新版：两步生成超级目录（永不超时）===================
+def generate_full_outline(tender_md: str) -> str:
+    tender_text = Path(tender_md).read_text(encoding="utf-8")
+    print(f"招标文件共 {len(tender_text)//2} 字，开始两阶段生成四级目录...")
+
+    # 第一步：先让模型只看前 6 万字，生成一个【简洁但完整】的三级目录（超快，10秒内出）
+    prompt1 = f"""请仔细阅读以下招标文件核心内容，只输出一个简洁但完整的三级目录（一级用“一、”，二级用“1、”，三级用“1.1、”）。
+不要四级标题，不要任何说明文字，不要页码。
+
+招标文件摘录（最关键部分）：
+{tender_text[:60000]}
+
+直接输出三级目录："""
+
+    print("第1步：生成三级骨架（10秒内必出）...")
+    outline_skeleton = call_llm([{"role": "user", "content": prompt1}],
+                                temperature=0.01, max_tokens=10000)
+
+    # 第二步：拿着这个骨架，再让模型把每个三级标题下面展开成 8～15 个四级标题（分批进行，永不超时）
+    print("第2步：开始把每个三级标题展开成四级...")
+    final_lines = []
+    level3_titles = []
+    current_level3 = ""
+
+    for line in outline_skeleton.split('\n'):
+        line = line.strip()
+        if re.match(r'^\d+\.\d+、', line) or re.match(r'^\d+\.\d+ ', line):
+            current_level3 = line
+            level3_titles.append(current_level3)
+            final_lines.append(line)  # 三级原样保留
+        elif line and not line.startswith(('一、', '二、', '三、', '四、', '五、', '六、', '七、', '八、')):
+            final_lines.append(line)
+
+    # 每 8个三级标题为一组，展开四级（稳到爆）
+    full_outline = outline_skeleton + "\n"
+    for i in range(0, len(level3_titles), 8):
+        batch = level3_titles[i:i+8]
+        batch_text = "\n".join(batch)
+
+        prompt2 = f"""你是一位招投标专家，请把下面这几个三级标题分别展开成 10～18 个专业四级标题（格式必须是 1.1.1、1.1.2、……）。
+只输出四级标题部分，不要重复三级标题本身。
+
+需要展开的三级标题：
+{batch_text}
+
+招标文件关键要求（用于展开参考）：
+{tender_text[:50000]}
+
+直接输出四级标题："""
+
+        print(f"  正在展开第 {i//8 + 1} 组四级标题（{len(batch)}个）...")
+        level4_text = call_llm([{"role": "user", "content": prompt2}],
+                               temperature=0.2, max_tokens=20000)
+        full_outline += "\n" + level4_text + "\n"
+        time.sleep(2)
+
+    # 保存并返回
+    Path("output/四级目录.md").write_text(full_outline, encoding="utf-8")
+    print(f"超级四级目录生成成功！总计约 {len(full_outline)//2} 字（再也不怕超时了！）")
+    return full_outline
+
+
+# ==================== 分批生成正文（每批最多6个四级标题，避免超上下文）===================
+def batch_fill_content(outline: str, tender_text: str) -> str:
+    level4_titles = [line.strip() for line in outline.split('\n')
+                     if
+                     re.match(r'^\d+\.\d+\.\d+、', line.strip()) or re.match(r'^[0-9]+\.[0-9]+\.[0-9]+ ', line.strip())]
+    print(f"共检测到 {len(level4_titles)} 个四级标题，将分批生成详细内容...")
+
+    all_content = ["# 正文内容开始"]
+    batch_size = 6  # Qwen3-30B 128K 下，6个四级标题 + 招标文件摘要 ≈ 80K tokens，安全
+
+    for i in range(0, len(level4_titles), batch_size):
+        batch = level4_titles[i:i + batch_size]
+        titles_str = "\n".join(batch)
+
+        prompt = f"""请为以下【{len(batch)}个四级标题】撰写极其详细、专业、可直接用于正式投标的正文内容。
+
+要求每小节：
+- 500—1000字（内容充实、逻辑严密）
+- 至少包含 2 张以上专业 Markdown 表格（如进度表、资源配置表、检测项目表等）
+- 使用【投标单位全称】【项目负责人】【联系电话】等占位符
+- 语言正式、响应招标文件每一项要求
+- 图文并茂（插入流程图、架构图说明文字）
+
+当前批次标题：
+{titles_str}
+
+招标文件核心要求摘要（已精炼）：
+{tender_text[:60000]}  # 控制在6万字以内，避免超上下文
+
+请按顺序为每个标题撰写完整内容，用 --- 分隔。"""
+
+        print(f"正在生成第 {i // batch_size + 1}/{len(level4_titles) // batch_size + 1} 批（{len(batch)}个小节）...")
+        part = call_llm([{"role": "user", "content": prompt}], temperature=0.45, max_tokens=32000)
+        all_content.append(part)
+        time.sleep(2)  # 礼貌等待，避免打满GPU
+
+    final_content = "\n\n---\n\n".join(all_content)
+    Path("output/正文内容.md").write_text(final_content, encoding="utf-8")
+    print(f"所有正文生成完成！总计约 {len(final_content) // 2} 字")
+    return final_content
+
+
+# ==================== 本地扩容到 5 万字+（美观填充）===================
+def expand_to_50000_words(content: str) -> str:
+    current = len(content)
+    if current >= 100000:
+        return content
+    print(f"当前 {current // 2} 字，正在补充至 5 万字+...")
+    # 补充常见必备内容
+    appendix = """
+### 六、售后服务体系
+#### 6.1 服务承诺
+我单位承诺：7×24小时响应，2小时内到达现场，终身免费维护核心系统...
+
+#### 6.2 维保人员配置表
+| 序号 | 岗位       | 姓名     | 资质证书             | 联系方式     |
+|------|------------|----------|----------------------|--------------|
+| 1    | 项目经理   | 【项目负责人】 | PMP、一级建造师     | 138xxxxxxx  |
+
+### 七、类似工程业绩
+| 序号 | 项目名称                 | 业主单位           | 合同金额(万元) | 完成时间 | 联系人   |
+|------|--------------------------|------------|----------------|----------|----------|
+| 1    | xx市智慧交通一期工程     | xx市交通局 | 3860           | 2024.12  | 张工     |
+"""
+    content += appendix * 15
+    return content
+
+
+# ==================== 强制刷新 Word 目录（同前）===================
+def update_word_toc(docx_path: str):
+    try:
+        import win32com.client as win32
+        import pythoncom
+        pythoncom.CoInitialize()
+        word = win32.Dispatch('Word.Application')
+        word.Visible = False
+        doc = word.Documents.Open(os.path.abspath(docx_path))
+        for toc in doc.TablesOfContents:
+            toc.Update()
+        doc.Save()
+        doc.Close()
+        word.Quit()
+    except Exception as e:
+        print(f"Word目录自动更新失败（可手动右键更新）：{e}")
+
+
+# ==================== 主流程 ====================
+def main():
+    """Run the whole pipeline: tender .docx -> Markdown -> outline -> body -> bid .docx.
+
+    Intermediate files are written under ``output/``; the final document is
+    written to OUTPUT_WORD and then opened with ``os.startfile``.
+    """
+    print("启动本地 Qwen3-30B 投标文件生成器（128K上下文版）\n")
+    os.makedirs("output", exist_ok=True)
+
+    # 1. Convert the tender document to Markdown
+    tender_md = word_to_md(INPUT_WORD)
+    tender_text = Path(tender_md).read_text(encoding="utf-8")
+
+    # 2. Generate the detailed outline
+    outline = generate_full_outline(tender_md)
+
+    # 3. Generate the body text in batches, then pad it if it is short
+    content = batch_fill_content(outline, tender_text)
+    content = expand_to_50000_words(content)
+
+    # 4. Assemble the final Markdown
+    final_md = f"""# 【投标单位全称】
+
+## {Path(INPUT_WORD).stem} - 投标文件
+
+{outline}
+
+{content}
+
+## 附件清单
+- 营业执照（副本）
+- 法人授权委托书
+- 资质证书扫描件
+- 类似业绩证明材料
+- 偏离表
+"""
+    final_md_path = "output/最终投标文件.md"
+    Path(final_md_path).write_text(final_md, encoding="utf-8")
+    print(f"\n最终 Markdown 生成成功！总计约 {len(final_md) // 2} 字")
+
+    # 5. Convert to Word: Pandoc first, python-docx as the fallback
+    print("正在转换为 Word 文档...")
+    success = False
+    pandoc_cmd = which("pandoc") or which("pandoc.exe")
+    if pandoc_cmd and os.path.exists(pandoc_cmd):
+        # Use template.docx as the style reference when it exists in the
+        # working directory
+        cmd = [pandoc_cmd, final_md_path, "-o", OUTPUT_WORD, "--reference-doc=template.docx"] if os.path.exists(
+            "template.docx") else [pandoc_cmd, final_md_path, "-o", OUTPUT_WORD]
+        if subprocess.run(cmd, capture_output=True).returncode == 0:
+            success = True
+
+    if not success:
+        print("Pandoc 失败，使用 python-docx 强制生成...")
+        doc = Document()
+        # Minimal Markdown handling: '#'..'####' become headings of level
+        # 0..3, every other non-empty line becomes a plain paragraph
+        for line in final_md.split('\n'):
+            l = line.strip()
+            if l.startswith("# "):
+                doc.add_heading(l[2:], 0)
+            elif l.startswith("## "):
+                doc.add_heading(l[3:], 1)
+            elif l.startswith("### "):
+                doc.add_heading(l[4:], 2)
+            elif l.startswith("#### "):
+                doc.add_heading(l[5:], 3)
+            elif l:
+                doc.add_paragraph(l)
+        doc.save(OUTPUT_WORD)
+
+    update_word_toc(OUTPUT_WORD)
+    print(f"\n大功告成！投标文件已生成：")
+    print(f"   {OUTPUT_WORD}")
+    print(f"   总字数约：{len(final_md) // 2} 字")
+    # Open the result with the associated application
+    os.startfile(OUTPUT_WORD)
+
+
+# Run the pipeline only when executed as a script
+if __name__ == "__main__":
+    main()
--- a/pycache/config.cpython-312.pyc
+++ b/pycache/config.cpython-312.pyc
--- a/pycache/detect.cpython-312.pyc
+++ b/pycache/detect.cpython-312.pyc
--- a/pycache/main.cpython-312.pyc
+++ b/pycache/main.cpython-312.pyc
--- a/pycache/manager.cpython-312.pyc
+++ b/pycache/manager.cpython-312.pyc
--- a/pycache/process.cpython-312.pyc
+++ b/pycache/process.cpython-312.pyc
--- a/config.py
+++ b/config.py
@ -0,0 +1,66 @@
+from typing import List
+
+import torch
+from pydantic import BaseModel
+
+# Device configuration: first CUDA GPU when available, otherwise CPU
+DEVICE = "cuda:0" if torch.cuda.is_available() else "cpu"
+
+# Default detection parameters
+DEFAULT_CONF = 0.25  # Fallback confidence threshold when a model's params omit one
+DEFAULT_IOU = 0.5  # IoU above which a lower-ranked same-class box is suppressed when merging
+DEFAULT_MIN_SIZE = 8  # Minimum box width and height kept from sliced detection
+DEFAULT_POS_THRESH = 5  # Centre distance below which same-class boxes count as duplicates
+
+# Per-model configuration, keyed by display name.
+#   model_path: weights file; a model whose file is missing is skipped at load time
+#   types:      type names that clients may request
+#   type_to_id: type name -> class id passed to the model as a class filter
+#   params:     thresholds and switches read by YOLODetector
+MODEL_CONFIGS = {
+    "安全施工模型": {
+        "model_path": "models/ppe_state_model/best.pt",
+        "types": ["novest", "nohelmet"],
+        "type_to_id": {"novest": 0, "nohelmet": 2},
+        "params": {
+            "enable_primary": True,
+            "primary_conf": 0.55,
+            "secondary_conf": 0.6,
+            "final_conf": 0.65,
+            "enable_multi_scale": True,
+            "multi_scales": [0.75, 1.0, 1.25],
+            "enable_secondary": True,
+            "slice_size": 512,
+            "overlap_ratio": 0.3,
+            "weight_primary": 0.4,
+            "weight_secondary": 0.6
+        }
+    },
+    "烟雾火灾模型": {
+        "model_path": "models/fire_smoke_model/best.pt",
+        "types": ["fire", "smoke"],
+        "type_to_id": {"fire": 0, "smoke": 1},
+        "params": {
+            "enable_primary": True,
+            "primary_conf": 0.99,
+            "secondary_conf": 0.99,
+            "final_conf": 0.99,
+            "enable_multi_scale": True,
+            "multi_scales": [0.75, 1.0, 1.25],
+            "enable_secondary": True,
+            "slice_size": 512,
+            "overlap_ratio": 0.3,
+            "weight_primary": 0.4,
+            "weight_secondary": 0.6
+        }
+    }
+}
+
+# Adaptive SAHI slicing rules as (pixel-count threshold, (slice size, overlap ratio)).
+# The first rule whose threshold the image's pixel count exceeds is used.
+SLICE_RULES = [
+    (12_000_000, (384, 0.35)),
+    (3_000_000, (512, 0.3)),
+    (0, (640, 0.25))
+]
+
+
+# Response body shared by the detection endpoints.
+class DetectionResponse(BaseModel):
+    hasTarget: int  # 1 when at least one target was found, otherwise 0
+    originalImgSize: List[int]  # [width, height] of the input image
+    targets: List[dict]  # one dict per detected target
+    processing_errors: List[str] = []  # messages for failures that did not abort the request
--- a/detect.py
+++ b/detect.py
@ -0,0 +1,313 @@
+import os
+from collections import defaultdict
+
+import cv2
+import numpy as np
+from sahi import AutoDetectionModel
+from sahi.predict import get_sliced_prediction
+from ultralytics import YOLO
+
+from config import DEVICE, DEFAULT_IOU, DEFAULT_MIN_SIZE, DEFAULT_POS_THRESH, SLICE_RULES, DEFAULT_CONF
+
+
+class YOLODetector:
+    def __init__(self, model_path, params, type_to_id):
+        # 加载YOLO模型
+        self.model = YOLO(model_path)
+        self.model.to(DEVICE)
+        self.class_names = self.model.names
+        self.type_to_id = type_to_id
+
+        self.params = params
+        self.enable_primary = params.get("enable_primary", True)
+        self.primary_conf = params.get("primary_conf", DEFAULT_CONF)  # 初级检测阈值
+        self.secondary_conf = params.get("secondary_conf", DEFAULT_CONF)  # 次级检测阈值
+        self.final_conf = params.get("final_conf", DEFAULT_CONF)  # 最终展示阈值
+
+        # SAHI模型
+        self.sahi_model = None
+        if params["enable_secondary"]:
+            self.sahi_model = AutoDetectionModel.from_pretrained(
+                model_type='yolov8',
+                model_path=model_path,
+                confidence_threshold=self.secondary_conf,
+                device=DEVICE
+            )
+
+        # 统计
+        self.stats = defaultdict(int)
+
+    def get_adaptive_slice(self, total_pixels):
+        """自适应切片参数"""
+        for pixel_thresh, (size, overlap) in SLICE_RULES:
+            if total_pixels > pixel_thresh:
+                return size, overlap
+        return self.params["slice_size"], self.params["overlap_ratio"]
+
+    def multi_scale_detect(self, img_path):
+        """多尺度检测（使用模型专属初级阈值）"""
+        detections = []
+        img = cv2.imread(img_path)
+        h, w = img.shape[:2]
+
+        for scale in self.params["multi_scales"]:
+            if scale == 1.0:
+                # 原尺度检测
+                results = self.model(
+                    img_path,
+                    conf=self.primary_conf,  # 模型专属初级阈值
+                    device=DEVICE,
+                    classes=self.target_ids,
+                    verbose=False
+                )
+            else:
+                # 缩放检测
+                nw, nh = int(w * scale), int(h * scale)
+                scaled_img = cv2.resize(img, (nw, nh))
+                temp_path = f"temp_scale_{scale}.jpg"
+                cv2.imwrite(temp_path, scaled_img)
+
+                results = self.model(
+                    temp_path,
+                    conf=self.primary_conf,  # 模型专属初级阈值
+                    device=DEVICE,
+                    classes=self.target_ids,
+                    verbose=False
+                )
+                os.remove(temp_path)
+
+            # 解析结果（核心修复：增加对result.boxes为None的判断）
+            for result in results:
+                # 检查boxes是否存在且非空
+                if result.boxes is None:
+                    continue
+                for box in result.boxes:
+                    bbox = box.xyxy[0].tolist()
+                    if scale != 1.0:
+                        bbox = [coord / scale for coord in bbox]
+
+                    detections.append({
+                        "box": bbox,
+                        "conf": box.conf[0].item(),
+                        "class": box.cls[0].item(),
+                        "class_name": self.class_names[int(box.cls[0])],
+                        "source": "primary"
+                    })
+
+        return detections
+
+    def primary_detect(self, img_path):
+        """初次检测（使用模型专属初级阈值）- 新增enable_primary判断"""
+        # 新增：如果禁用一级检测，直接返回空列表
+        if not self.enable_primary:
+            self.stats["primary"] = 0
+            print("  一级检测已禁用，跳过初级检测")
+            return []
+
+        if self.params["enable_multi_scale"]:
+            detections = self.multi_scale_detect(img_path)
+        else:
+            results = self.model(
+                img_path,
+                conf=self.primary_conf,  # 模型专属初级阈值
+                device=DEVICE,
+                classes=self.target_ids,
+                verbose=False
+            )
+            # 解析结果（核心修复：增加对result.boxes为None的判断）
+            detections = []
+            for result in results:
+                # 检查boxes是否存在且非空
+                if result.boxes is None:
+                    continue
+                for box in result.boxes:
+                    detections.append({
+                        "box": box.xyxy[0].tolist(),
+                        "conf": box.conf[0].item(),
+                        "class": box.cls[0].item(),
+                        "class_name": self.class_names[int(box.cls[0])],
+                        "source": "primary"
+                    })
+
+        self.stats["primary"] = len(detections)
+        return detections
+
+    def secondary_detect(self, img_path):
+        """SAHI切片检测（已在初始化时使用模型专属次级阈值）"""
+        if not self.params["enable_secondary"] or not self.sahi_model:
+            return []
+
+        img = cv2.imread(img_path)
+        h, w = img.shape[:2]
+        total_pixels = w * h
+        slice_size, overlap = self.get_adaptive_slice(total_pixels)
+
+        # SAHI切片预测
+        sliced_results = get_sliced_prediction(
+            img_path,
+            self.sahi_model,
+            slice_height=slice_size,
+            slice_width=slice_size,
+            overlap_height_ratio=overlap,
+            overlap_width_ratio=overlap,
+            verbose=0
+        )
+
+        detections = []
+        for obj in sliced_results.object_prediction_list:
+            if self.target_ids and obj.category.id not in self.target_ids:
+                continue
+
+            bbox = obj.bbox.to_xyxy()
+            bw, bh = bbox[2] - bbox[0], bbox[3] - bbox[1]
+
+            if bw >= DEFAULT_MIN_SIZE and bh >= DEFAULT_MIN_SIZE:
+                detections.append({
+                    "box": bbox,
+                    "conf": obj.score.value,
+                    "class": obj.category.id,
+                    "class_name": obj.category.name,
+                    "source": "secondary"
+                })
+
+        self.stats["secondary"] = len(detections)
+        return detections
+
+    @staticmethod
+    def calculate_iou(box1, box2):
+        """计算IoU"""
+        x11, y11, x21, y21 = box1
+        x12, y12, x22, y22 = box2
+
+        inter_x1 = max(x11, x12)
+        inter_y1 = max(y11, y12)
+        inter_x2 = min(x21, x22)
+        inter_y2 = min(y21, y22)
+
+        inter_area = max(0, inter_x2 - inter_x1) * max(0, inter_y2 - inter_y1)
+        area1 = (x21 - x11) * (y21 - y11)
+        area2 = (x22 - x12) * (y22 - y12)
+        union_area = area1 + area2 - inter_area
+
+        return inter_area / union_area if union_area > 0 else 0
+
+    def merge_detections(self, primary_dets, secondary_dets):
+        """融合检测结果"""
+        if not primary_dets:
+            return secondary_dets
+        if not secondary_dets:
+            return primary_dets
+
+        # 加权置信度
+        all_dets = []
+        for det in primary_dets:
+            det["weighted_conf"] = det["conf"] * self.params["weight_primary"]
+            all_dets.append(det)
+        for det in secondary_dets:
+            det["weighted_conf"] = det["conf"] * self.params["weight_secondary"]
+            all_dets.append(det)
+
+        # 按类别分组融合
+        class_groups = defaultdict(list)
+        for det in all_dets:
+            class_groups[det["class"]].append(det)
+
+        merged = []
+        for cls_id, cls_dets in class_groups.items():
+            cls_dets.sort(key=lambda x: x["weighted_conf"], reverse=True)
+            suppressed = [False] * len(cls_dets)
+
+            for i in range(len(cls_dets)):
+                if suppressed[i]:
+                    continue
+                merged.append(cls_dets[i])
+                for j in range(i + 1, len(cls_dets)):
+                    if not suppressed[j] and self.calculate_iou(cls_dets[i]["box"], cls_dets[j]["box"]) > DEFAULT_IOU:
+                        suppressed[j] = True
+
+        self.stats["merged"] = len(merged)
+        return merged
+
+    def post_process(self, detections):
+        """后处理（使用模型专属最终阈值）"""
+        # 置信度过滤：模型专属最终阈值
+        filtered = [det for det in detections if det["conf"] >= self.final_conf]
+
+        # 位置去重
+        final_dets = []
+        for curr_det in filtered:
+            curr_cx = (curr_det["box"][0] + curr_det["box"][2]) / 2
+            curr_cy = (curr_det["box"][1] + curr_det["box"][3]) / 2
+            curr_cls = curr_det["class"]
+            duplicate = False
+
+            for idx, exist_det in enumerate(final_dets):
+                if exist_det["class"] != curr_cls:
+                    continue
+
+                exist_cx = (exist_det["box"][0] + exist_det["box"][2]) / 2
+                exist_cy = (exist_det["box"][1] + exist_det["box"][3]) / 2
+                dist = np.sqrt((curr_cx - exist_cx) **2 + (curr_cy - exist_cy)** 2)
+
+                if dist < DEFAULT_POS_THRESH:
+                    duplicate = True
+                    if curr_det["conf"] > exist_det["conf"]:
+                        final_dets[idx] = curr_det
+                    break
+
+            if not duplicate:
+                final_dets.append(curr_det)
+
+        self.stats["final"] = len(final_dets)
+        return final_dets
+
+    def format_results(self, detections):
+        """格式化结果"""
+        formatted = []
+        for det in detections:
+            x1, y1, x2, y2 = det["box"]
+            formatted.append({
+                "type": det["class_name"],
+                "size": [int(round(x2 - x1)), int(round(y2 - y1))],
+                "leftTopPoint": [int(round(x1)), int(round(y1))],
+                "score": round(det["conf"], 4),
+            })
+        return formatted
+
+    def get_detection_stats(self):
+        """获取检测统计信息"""
+        return dict(self.stats)
+
+    def detect(self, img_path, target_types=None):
+        """完整检测流程"""
+        # 重置统计
+        self.stats = defaultdict(int)
+
+        # 设置目标类别
+        if target_types:
+            self.target_ids = [self.type_to_id[cls] for cls in target_types if cls in self.type_to_id]
+        else:
+            self.target_ids = None
+
+        # 执行检测
+        primary_dets = self.primary_detect(img_path)
+        print(f"  初级检测后: {self.stats['primary']} 个目标")
+
+        if self.params["enable_secondary"]:
+            secondary_dets = self.secondary_detect(img_path)
+            print(f"  次级检测后: {self.stats['secondary']} 个目标")
+            merged_dets = self.merge_detections(primary_dets, secondary_dets)
+            print(f"  融合去重后: {self.stats['merged']} 个目标")
+        else:
+            merged_dets = primary_dets
+            print(f"  次级检测未启用")
+
+        # 后处理
+        processed_dets = self.post_process(merged_dets)
+        print(f"  过滤低置信度后: {self.stats['final']} 个目标")
+
+        print("  最终检测目标详情：")
+        for idx, det in enumerate(processed_dets, 1):
+            print(f"    目标{idx} - 类型：{det['class_name']}，置信度：{det['conf']:.4f}")
+
+        return self.format_results(processed_dets)
--- a/main.py
+++ b/main.py
@ -0,0 +1,125 @@
+import io
+import os
+import tempfile
+from contextlib import asynccontextmanager
+
+import requests
+import uvicorn
+from PIL import Image
+from fastapi import FastAPI, HTTPException
+from fastapi.middleware.cors import CORSMiddleware
+from pydantic import BaseModel, HttpUrl
+
+from config import DetectionResponse
+from process import detect_large_image_from_url
+
+# 全局检测管理器
+detector_manager = None
+
+
+@asynccontextmanager
+async def lifespan(app: FastAPI):
+    global detector_manager
+    try:
+        from manager import UnifiedDetectionManager
+        detector_manager = UnifiedDetectionManager()
+        print("检测管理器初始化成功")
+    except Exception as e:
+        print(f"初始化失败：{str(e)}")
+        raise
+    yield
+
+
+app = FastAPI(lifespan=lifespan, title="目标检测API", version="1.0.0")
+
+# Configure cross-origin requests (CORS)
+# NOTE(review): every origin, method and header is allowed while credentials
+# are enabled — confirm this is intended outside development.
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+
+
+# Request body of POST /detect_image.
+class DetectionRequest(BaseModel):
+    type: str  # comma-separated detection type names
+    url: HttpUrl  # location the image is downloaded from
+
+
+# Request body of POST /detect_process.
+class DetectionProcessRequest(BaseModel):
+    url: HttpUrl  # location of the image to process
+
+
+@app.post("/detect_image", response_model=DetectionResponse)
+async def run_detection_image(request: DetectionRequest):
+    # 解析检测类型
+    requested_types = {t.strip().lower() for t in request.type.split(',') if t.strip()}
+    print(f"请求的检测类型: {requested_types}")
+    if not requested_types:
+        raise HTTPException(status_code=400, detail="未指定检测类型")
+
+    # 下载图片
+    try:
+        response = requests.get(str(request.url), timeout=15)
+        response.raise_for_status()
+
+        # 获取图片尺寸
+        with Image.open(io.BytesIO(response.content)) as img:
+            img_size = [img.width, img.height]
+
+        # 创建临时文件
+        with tempfile.NamedTemporaryFile(suffix=".jpg", delete=False) as temp_file:
+            temp_file.write(response.content)
+            temp_path = temp_file.name
+
+    except Exception as e:
+        raise HTTPException(status_code=400, detail=f"图片处理失败：{str(e)}")
+
+    # 执行检测
+    results = []
+    errors = []
+
+    try:
+        detection_results = detector_manager.detect(temp_path, ",".join(requested_types))
+        if detection_results:
+            results = detection_results
+    except Exception as e:
+        errors.append(f"检测失败：{str(e)}")
+    finally:
+        # 清理临时文件
+        if os.path.exists(temp_path):
+            os.remove(temp_path)
+
+    return {
+        "hasTarget": 1 if results else 0,
+        "originalImgSize": img_size,
+        "targets": results,
+        "processing_errors": errors
+    }
+
+
+# Delegates to process.detect_large_image_from_url with the URL as a plain string.
+@app.post("/detect_process", response_model=DetectionResponse)
+async def run_detection_process(request: DetectionProcessRequest):
+    return detect_large_image_from_url(str(request.url))
+
+
+@app.get("/supported_types")
+async def get_supported_types():
+    if detector_manager:
+        info = detector_manager.get_available_info()
+        return {
+            "supported_types": info["supported_types"],
+        }
+    return {"supported_types": []}
+
+
+# Command-line entry point: start uvicorn with optional host/port/reload flags
+if __name__ == "__main__":
+    import argparse
+
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--host", default="0.0.0.0")
+    parser.add_argument("--port", type=int, default=8000)
+    parser.add_argument("--reload", action="store_true")
+    args = parser.parse_args()
+    # The app is passed as an import string ("module:attribute")
+    uvicorn.run("main:app", host=args.host, port=args.port, reload=args.reload)
--- a/manager.py
+++ b/manager.py
@ -0,0 +1,116 @@
+import os
+from collections import defaultdict
+
+from config import MODEL_CONFIGS
+from detect import YOLODetector
+
+
+class UnifiedDetectionManager:
+    """统一检测管理器"""
+
+    def __init__(self):
+        self.detectors = {}  # 检测器实例
+        self.type_to_model = {}  # 类别到模型映射
+        self.loaded_models = []  # 已加载模型
+        self.type_to_id = {}  # 全局类别ID映射
+
+        self._load_models()
+
+    def _load_models(self):
+        """加载所有模型"""
+        if not MODEL_CONFIGS:
+            raise ValueError("模型配置为空")
+
+        for model_name, config in MODEL_CONFIGS.items():
+            try:
+                model_path = config["model_path"]
+                if not os.path.exists(model_path):
+                    print(f"跳过 {model_name}: 模型文件不存在 - {model_path}")
+                    continue
+
+                # 创建检测器（自动传递新增的enable_primary配置）
+                detector = YOLODetector(
+                    model_path=model_path,
+                    params=config["params"],
+                    type_to_id=config["type_to_id"]
+                )
+
+                # 保存状态
+                self.detectors[model_name] = detector
+                self.loaded_models.append(model_name)
+
+                # 建立映射
+                for det_type in config["types"]:
+                    det_type_lower = det_type.lower()
+                    if det_type_lower in self.type_to_model:
+                        print(f"警告: 类别 '{det_type}' 映射冲突")
+                    self.type_to_model[det_type_lower] = model_name
+                    self.type_to_id[det_type_lower] = config["type_to_id"][det_type_lower]
+
+                print(f"加载成功: {model_name}")
+
+            except Exception as e:
+                print(f"加载失败 {model_name}: {str(e)}")
+                continue
+
+        print(f"模型加载完成: {len(self.loaded_models)}/{len(MODEL_CONFIGS)}")
+        print(f"支持类别: {list(self.type_to_model.keys())}")
+
+    def parse_types(self, types_str):
+        """解析检测类型"""
+        if not types_str:
+            raise ValueError("检测类型为空")
+
+        # 清理输入
+        requested_types = list(set(t.strip().lower() for t in types_str.split(',') if t.strip()))
+
+        # 按模型分组
+        model_type_map = defaultdict(list)
+        for det_type in requested_types:
+            if det_type in self.type_to_model:
+                model_name = self.type_to_model[det_type]
+                model_type_map[model_name].append(det_type)
+            else:
+                print(f"忽略未知类别: {det_type}")
+
+        if not model_type_map:
+            raise ValueError("无有效检测类别")
+
+        return model_type_map
+
+    def detect(self, img_path, detection_types):
+        """执行检测"""
+        if not os.path.exists(img_path):
+            raise FileNotFoundError(f"图像不存在: {img_path}")
+
+        # 解析类型
+        model_type_map = self.parse_types(detection_types)
+
+        # 执行检测（自动适配enable_primary配置）
+        all_results = []
+        for model_name, target_types in model_type_map.items():
+            if model_name not in self.detectors:
+                continue
+
+            print(f"检测: {model_name} -> {target_types}")
+            try:
+                results = self.detectors[model_name].detect(img_path, target_types)
+                all_results.extend(results)
+
+                # 获取详细统计信息
+                stats = self.detectors[model_name].get_detection_stats()
+                print(f"  {model_name}详细统计: {stats}")
+
+            except Exception as e:
+                print(f"检测失败 {model_name}: {str(e)}")
+
+        print(f"检测完成: 总共 {len(all_results)} 个结果")
+        return all_results
+
+    def get_available_info(self):
+        """获取可用信息"""
+        return {
+            "loaded_models": self.loaded_models,
+            "supported_types": list(self.type_to_model.keys()),
+            "type_to_model": self.type_to_model
+        }
--- a/models/fire_smoke_model/best.pt
+++ b/models/fire_smoke_model/best.pt
--- a/models/ppe_state_model/best.pt
+++ b/models/ppe_state_model/best.pt
--- a/models/solor_bracket_model/best.pt
+++ b/models/solor_bracket_model/best.pt
--- a/process.py
+++ b/process.py
@ -0,0 +1,180 @@
+import os
+import tempfile
+from typing import List
+from urllib.parse import urlparse
+
+import cv2
+import requests
+from pydantic import BaseModel
+from tqdm import tqdm
+from ultralytics import YOLO
+
+
+# Response model returned by detect_large_image_from_url.
+# NOTE: documented with comments rather than a class docstring so the
+# generated model metadata stays exactly as it was.
+class DetectionResponse(BaseModel):
+    # 1 when at least one target was detected, otherwise 0
+    hasTarget: int
+    # Source image size as [width, height]; stays [0, 0] if the image was never sliced
+    originalImgSize: List[int]
+    # One dict per detection with the keys "type", "size", "leftTopPoint" and "score"
+    targets: List[dict]
+    # Error messages collected while processing; empty when nothing went wrong
+    processing_errors: List[str] = []
+
+
+def download_large_file(url, chunk_size=1024 * 1024):
+    """Stream a remote file into a temporary file and return that file's path.
+
+    The body is fetched in ``chunk_size`` pieces so the whole payload never
+    has to fit in memory, and a tqdm progress bar is shown while it is
+    written. The temporary file is created with ``delete=False``; the caller
+    owns it and must remove it when done.
+
+    Args:
+        url: HTTP(S) address of the file to download.
+        chunk_size: Number of bytes requested per streamed chunk.
+
+    Returns:
+        Path of the temporary ``.png`` file holding the downloaded bytes.
+
+    Raises:
+        Exception: On any failure (HTTP error, timeout, disk error, ...).
+            The message is prefixed with "下载失败: " and the original
+            exception is attached as ``__cause__``. A partially written
+            temporary file is removed before raising.
+    """
+    # Tracked explicitly so the error path knows whether there is a file to clean up.
+    temp_file_path = None
+    try:
+        # The context manager releases the streamed connection even when the
+        # copy loop fails half-way through.
+        with requests.get(url, stream=True, timeout=30) as response:
+            response.raise_for_status()
+
+            # A missing Content-Length yields 0; give tqdm None instead so it
+            # shows plain counters rather than a bogus "x / 0" total.
+            file_size = int(response.headers.get('Content-Length', 0)) or None
+
+            # Only the unique name is needed here; the file is reopened below.
+            temp_file = tempfile.NamedTemporaryFile(delete=False, suffix='.png')  # png suffix kept for downstream readers
+            temp_file_path = temp_file.name
+            temp_file.close()
+
+            with open(temp_file_path, 'wb') as f, tqdm(
+                    total=file_size, unit='B', unit_scale=True,
+                    desc=f"下载 {os.path.basename(urlparse(url).path)}"
+            ) as pbar:
+                for chunk in response.iter_content(chunk_size=chunk_size):
+                    if chunk:
+                        f.write(chunk)
+                        pbar.update(len(chunk))
+
+        return temp_file_path
+
+    except Exception as e:
+        error_msg = f"下载失败: {str(e)}"
+        print(error_msg)
+        if temp_file_path is not None:
+            try:
+                os.remove(temp_file_path)
+            except OSError:
+                # Best-effort cleanup: the download error below is the one worth reporting.
+                pass
+        raise Exception(error_msg) from e
+
+
+def _tile_origins(length, slice_size, step):
+    """Return the ordered, de-duplicated tile start offsets along one axis."""
+    origins = []
+    for index in range((length + step - 1) // step):
+        start = index * step
+        end = min(start + slice_size, length)
+        # Pull a truncated trailing tile back so it keeps the full slice size.
+        if end - start < slice_size:
+            start = max(0, end - slice_size)
+        origins.append(start)
+    # Several trailing tiles can be pulled back onto the same origin;
+    # dict.fromkeys drops those repeats while keeping first-seen order.
+    return list(dict.fromkeys(origins))
+
+
+def slice_large_image(image_path, slice_size=1024, overlap=100):
+    """Cut an image into overlapping square tiles.
+
+    Tiles are laid out row by row with a stride of ``slice_size - overlap``.
+    A tile that would run past the right or bottom edge is shifted back
+    inside the image so it keeps the full ``slice_size`` (images smaller
+    than ``slice_size`` yield a single, smaller tile on that axis). Each
+    tile origin is emitted once, so the same region is never returned twice.
+
+    Args:
+        image_path: Path of the image file to read with OpenCV.
+        slice_size: Edge length of a tile in pixels.
+        overlap: Number of pixels shared by neighbouring tiles; must be
+            smaller than ``slice_size``.
+
+    Returns:
+        A tuple ``(slices, (h, w))`` where ``slices`` is a list of
+        ``(x1, y1, tile)`` entries (``x1``/``y1`` being the tile's top-left
+        corner in the full image) and ``(h, w)`` is the full image size.
+
+    Raises:
+        ValueError: If the slicing parameters give a non-positive stride,
+            or if the image cannot be read.
+    """
+    # A non-positive stride would divide by zero or never advance.
+    if slice_size <= 0 or overlap >= slice_size:
+        raise ValueError(
+            f"切片参数无效: slice_size={slice_size}, overlap={overlap}"
+            "（要求 slice_size > 0 且 overlap < slice_size）"
+        )
+
+    img = cv2.imread(image_path)
+    if img is None:
+        raise ValueError(f"无法读取图像: {image_path}")
+
+    h, w = img.shape[:2]
+    step = slice_size - overlap
+
+    # Column origins are the same for every row, so compute them once.
+    col_origins = _tile_origins(w, slice_size, step)
+
+    slices = []
+    for y1 in _tile_origins(h, slice_size, step):
+        y2 = min(y1 + slice_size, h)
+        for x1 in col_origins:
+            x2 = min(x1 + slice_size, w)
+            slices.append((x1, y1, img[y1:y2, x1:x2]))
+
+    return slices, (h, w)
+
+
+def extract_detection_info(result, slice_offset_x, slice_offset_y):
+    """Convert the OBB detections of one slice into plain dicts.
+
+    Sizes are taken from the axis-aligned ``xyxy`` box of every detection
+    (x extent is the width, y extent is the height); the top-left corner is
+    shifted by the slice offset so it refers to the full image.
+
+    Args:
+        result: Prediction result for one slice, exposing ``obb`` and ``names``.
+        slice_offset_x: X coordinate of the slice's left edge in the full image.
+        slice_offset_y: Y coordinate of the slice's top edge in the full image.
+
+    Returns:
+        A list of dicts with the keys ``type``, ``size`` ([width, height]),
+        ``leftTopPoint`` ([x, y] in full-image coordinates) and ``score``
+        (confidence rounded to 4 decimals). Empty when ``result.obb`` is
+        ``None`` or holds no boxes.
+    """
+    obb = result.obb
+    if obb is None or len(obb) == 0:
+        return []
+
+    boxes = obb.xyxy.cpu().numpy()
+    class_ids = obb.cls.cpu().numpy()
+    scores = obb.conf.cpu().numpy()
+
+    found = []
+    for (left, top, right, bottom), raw_cls, raw_score in zip(boxes, class_ids, scores):
+        # Extent inside the slice; unaffected by the slice offset.
+        box_w = right - left
+        box_h = bottom - top
+
+        # Only the anchor corner has to be moved into full-image coordinates.
+        global_left = left + slice_offset_x
+        global_top = top + slice_offset_y
+
+        label = result.names[int(raw_cls)]
+        found.append({
+            "type": label,
+            "size": [int(round(box_w)), int(round(box_h))],
+            "leftTopPoint": [int(round(global_left)), int(round(global_top))],
+            "score": round(float(raw_score), 4)
+        })
+
+    return found
+
+
+def detect_large_image_from_url(image_url: str, slice_size: int = 1024, overlap: int = 100,
+                                conf: float = 0.5) -> DetectionResponse:
+    """Download an image, run tiled detection on it and summarise the result.
+
+    The image is downloaded to a temporary file, cut into overlapping tiles,
+    and every tile is passed through the solar-bracket model stored under
+    ``models/solor_bracket_model/best.pt`` next to this file. Detections of
+    all tiles are concatenated as they are; no cross-tile merging is done,
+    so a target inside an overlap region may be reported by both tiles.
+
+    This function does not raise: any failure is recorded in
+    ``processing_errors`` and whatever was detected up to that point is
+    still returned.
+
+    Args:
+        image_url: Address the image is downloaded from.
+        slice_size: Edge length of a tile in pixels.
+        overlap: Number of pixels shared by neighbouring tiles.
+        conf: Minimum confidence a detection needs to be kept. Defaults to
+            0.5, the threshold that used to be hard-coded.
+
+    Returns:
+        A ``DetectionResponse`` whose ``hasTarget`` is 1 when at least one
+        detection exists, ``originalImgSize`` is ``[width, height]``
+        (``[0, 0]`` if the image was never sliced), ``targets`` holds the
+        detections and ``processing_errors`` the collected error messages.
+    """
+    # The model path is fixed relative to the directory containing this file.
+    current_dir = os.path.dirname(os.path.abspath(__file__))
+    model_path = os.path.join(current_dir, "models", "solor_bracket_model", "best.pt")
+
+    processing_errors = []
+    all_detections = []
+    original_size = [0, 0]
+
+    try:
+        # Fail before downloading anything if the model is missing.
+        if not os.path.exists(model_path):
+            raise FileNotFoundError(f"模型文件不存在：{model_path}")
+
+        # Download the image to a temporary file.
+        temp_file_path = download_large_file(image_url)
+
+        try:
+            # Slice the image into tiles.
+            slices_info, (h, w) = slice_large_image(temp_file_path, slice_size, overlap)
+            original_size = [w, h]
+            print(f"完成切片: 共 {len(slices_info)} 个切片")
+
+            # Load the model and predict tile by tile.
+            model = YOLO(model_path)
+            print("开始逐张预测切片...")
+
+            for i, (x1, y1, slice_img) in enumerate(slices_info, 1):
+                print(f"预测第 {i}/{len(slices_info)} 个切片")
+                result = model(slice_img, conf=conf, verbose=False)[0]
+                # Tile-local boxes are shifted by the tile origin (x1, y1).
+                slice_detections = extract_detection_info(result, x1, y1)
+                all_detections.extend(slice_detections)
+                print(f"  本切片检测到 {len(slice_detections)} 个目标")
+
+        finally:
+            # Always remove the temporary download, even when prediction failed.
+            if os.path.exists(temp_file_path):
+                try:
+                    os.remove(temp_file_path)
+                    print("临时文件已删除")
+                except Exception as e:
+                    error_msg = f"删除临时文件失败: {str(e)}"
+                    print(error_msg)
+                    processing_errors.append(error_msg)
+
+    except Exception as e:
+        # Top-level boundary: record the failure instead of propagating it.
+        error_msg = str(e)
+        processing_errors.append(error_msg)
+        print(f"处理异常: {error_msg}")
+
+    # Build the response from whatever was collected.
+    return DetectionResponse(
+        hasTarget=1 if len(all_detections) > 0 else 0,
+        originalImgSize=original_size,
+        targets=all_detections,
+        processing_errors=processing_errors
+    )