2 月之前 · 4a506625db
--- a/README.md
+++ b/README.md
@@ -1,172 +1,85 @@
 
															-# 无人机检测 ONNX 模型推理工具
														
 
															+# UAV Detection System
														
 
															-## 项目概述
														
 
															-基于ONNX Runtime的无人机目标检测解决方案，支持：
														
 
															-- GPU加速推理（需CUDA环境）
														
 
															-- 自适应图像预处理流水线（CPU/GPU双模式）
														
 
															-- 误报过滤机制（ORB特征匹配）
														
 
															-- 多格式检测报告生成（CSV/Excel）
														
 
															+基于 ONNX 的无人机检测系统，支持单张图片和批量处理。
														
 
															-## 项目结构
														
 
															-```
														
 
															-Model/
														
 
															-├── src/                    # 源代码目录
														
 
															-│   ├── core/              # 核心功能模块
														
 
															-│   │   ├── inference.py   # 推理主程序
														
 
															-│   │   ├── feature_extractor.py
														
 
															-│   │   └── image_validation.py
														
 
															-│   ├── utils/             # 工具函数
														
 
															-│   │   ├── visualizer.py  # 可视化工具
														
 
															-│   │   └── dataset.py     # 数据集工具
														
 
															-│   └── analysis/          # 分析工具
														
 
															-│       ├── hotspot_analyzer.py
														
 
															-│       └── report_generator.py
														
 
															-├── data/                  # 数据目录
														
 
															-│   ├── false_positive/   # 误报样本
														
 
															-│   └── models/           # 模型文件
														
 
															-├── tests/                # 测试目录
														
 
															-├── outputs/              # 输出目录
														
 
															-└── docs/                 # 文档目录
														
 
															-```
														
 
															+## 功能特点
														
 
															+
														
 
															+- 支持 ONNX 模型推理
														
 
															+- 支持 CUDA 加速
														
 
															+- 支持批量处理图片
														
 
															+- 自动生成检测报告（CSV格式）
														
 
															+- 支持误报过滤
														
 
															+- 支持检测框面积比例限制
														
 
															+- 支持保存未检测到目标的图片
														
 
															 ## 环境要求
														
 
															-- Python 3.8+ 
														
 
															-- CUDA环境（如需GPU加速）
														
 
															-- 依赖库：
														
 
															-```bash
														
 
															-pip install -r requirements.txt
														
 
															-```
														
 
															-## 快速开始
														
 
															+- Python 3.8+
														
 
															+- OpenCV 4.5+
														
 
															+- ONNX Runtime 1.9+
														
 
															+- CUDA 11.0+ (可选，用于GPU加速)
														
 
															+
														
 
															+## 安装依赖
														
 
															-### 1. 安装依赖
														
 
															 ```bash
														
 
															 pip install -r requirements.txt
														
 
															 ```
														
 
															-### 2. 运行推理
														
 
															-在项目根目录下运行：
														
 
															+## 使用方法
														
 
															-#### 使用图形界面（推荐）
														
 
															-```bash
														
 
															-python -m src.core.inference --gui
														
 
															-```
														
 
															+### 命令行模式
														
 
															-#### 单张图片检测
														
 
															 ```bash
														
 
															-python -m src.core.inference --input 图片路径 --threshold 0.5 --output results --report excel
														
 
															-```
														
 
															+# 处理单张图片
														
 
															+python -m src.core.inference --input path/to/image.jpg --output results
														
 
															-#### 批量检测目录
														
 
															-```bash
														
 
															-python -m src.core.inference --input 图片目录 --max-bbox-ratio 0.1 --output batch_results --report all
														
 
															-```
														
 
															+# 处理整个目录
														
 
															+python -m src.core.inference --input path/to/images_dir --output results
														
 
															-## 参数说明
														
 
															-| 参数 | 类型 | 默认值 | 说明 |
														
 
															-|------|------|-------|-----|
														
 
															-| --input | path | 必填 | 输入图像路径/目录 |
														
 
															-| --threshold | float | 0.45 | 检测置信度阈值 |
														
 
															-| --max-bbox-ratio | float | 0.05 | 最大检测框面积比例 |
														
 
															-| --output | path | 自动生成 | 输出目录（自动创建） |
														
 
															-| --report | [csv/excel/all] | excel | 报告格式 |
														
 
															-| --save-empty | flag | False | 保存无检测结果的图像 |
														
 
															-| --gui | flag | False | 启用图形界面选择输入目录 |
														
 
															-
														
 
															-## 结果输出
														
 
															-输出目录包含：
														
 
															-- `目标截图/`：检测到的无人机目标截图
														
 
															-- `检测报告.xlsx`：包含检测时间、置信度、坐标等详细信息
														
 
															-- 带检测框的标注图像
														
 
															-
														
 
															-## 模型管理
														
 
															-- 模型文件位置：`data/models/UAV-250321.onnx`
														
 
															-- 模型版本通过文件名自动识别（如：UAV-250321.onnx 版本号为250321）
														
 
															-
														
 
															-## 常见问题
														
 
															-Q: 如何启用GPU加速？
														
 
															-A: 确保安装onnxruntime-gpu并配置CUDA环境，程序会自动优先使用GPU
														
 
															-
														
 
															-Q: 误报特征库如何更新？
														
 
															-A: 将误报样本放入data/false_positive目录，程序启动时会自动加载
														
 
															-
														
 
															-## 开发指南
														
 
															-1. 代码规范
														
 
															-   - 遵循PEP 8编码规范
														
 
															-   - 使用类型注解
														
 
															-   - 编写单元测试
														
 
															-
														
 
															-2. 测试
														
 
															-```bash
														
 
															-# 运行测试
														
 
															-pytest tests/
														
 
															+# 调整检测参数
														
 
															+python -m src.core.inference --input path/to/image.jpg --threshold 0.6 --max-bbox-ratio 0.1
														
 
															-# 生成测试覆盖率报告
														
 
															-pytest --cov=src tests/
														
 
															+# 保存未检测到目标的图片
														
 
															+python -m src.core.inference --input path/to/images_dir --save-empty
														
 
															 ```
														
 
															-3. 文档
														
 
															-   - 使用Google风格文档字符串
														
 
															-   - 保持README.md更新
														
 
															-   - 重要功能添加使用示例
														
 
															-
														
 
															-## 性能指标说明
														
 
															-
														
 
															-### 1. 基础统计指标
														
 
															+### 图形界面模式
														
 
															-- **总样本数**：CSV文件中所有唯一的图像文件数量
														
 
															-- **检测到的目标总数**：模型检测到的所有目标数量
														
 
															-- **真实目标总数（TP）**：确认的真实无人机目标数量
														
 
															-- **误报目标数（FP）**：错误检测为非无人机目标的数量
														
 
															-- **真阴性数量（TN）**：正确识别为非无人机目标的数量
														
 
															-
														
 
															-### 2. 性能评估指标
														
 
															-
														
 
															-- **准确率（Accuracy）**
														
 
															-  - 计算公式：`(TP + TN) / (TP + FP + TN)`
														
 
															-  - 说明：反映模型整体正确分类的能力，即正确预测的样本占总样本的比例
														
 
															-  - 取值范围：0-1，越接近1表示模型整体性能越好
														
 
															-
														
 
															-- **精确率（Precision）**
														
 
															-  - 计算公式：`TP / (TP + FP)`
														
 
															-  - 说明：反映模型在预测为正样本（无人机）时的准确程度
														
 
															-  - 取值范围：0-1，越接近1表示模型在预测无人机时越准确
														
 
															-
														
 
															-- **召回率（Recall）**
														
 
															-  - 计算公式：`TP / (TP + FN)`
														
 
															-  - 说明：反映模型发现所有真实无人机目标的能力
														
 
															-  - 取值范围：0-1，越接近1表示模型发现真实无人机的能力越强
														
 
															-
														
 
															-- **F1分数（F1 Score）**
														
 
															-  - 计算公式：`2 * (Precision * Recall) / (Precision + Recall)`
														
 
															-  - 说明：精确率和召回率的调和平均数，用于平衡精确率和召回率
														
 
															-  - 取值范围：0-1，越接近1表示模型在精确率和召回率之间取得更好的平衡
														
 
															-
														
 
															-- **误报率/虚警率（False Alarm Rate）**
														
 
															-  - 计算公式：`FP / (TN + FP)`
														
 
															-  - 说明：反映模型将非无人机目标错误识别为无人机的比例
														
 
															-  - 取值范围：0-1，越接近0表示模型在避免误报方面表现越好
														
 
															-
														
 
															-## 使用方法
														
 
															-
														
 
															-1. 运行推理：
														
 
															 ```bash
														
 
															-python src/core/inference.py
														
 
															+python -m src.core.inference --gui
														
 
															 ```
														
 
															-2. 分析性能：
														
 
															-```bash
														
 
															-python src/analysis/performance_analyzer.py
														
 
															-```
														
 
															+## 参数说明
														
 
															+
														
 
															+- `--input`: 输入图像路径或目录（必需）
														
 
															+- `--output`: 输出目录路径，默认为输入目录名+_results
														
 
															+- `--threshold`: 检测置信度阈值，默认0.5
														
 
															+- `--max-bbox-ratio`: 检测框最大面积比例阈值，默认0.05
														
 
															+- `--save-empty`: 是否保存未检测到目标的图片
														
 
															+- `--gui`: 启用图形界面选择输入目录
														
 
															 ## 输出说明
														
 
															-运行性能分析后，将在结果目录下生成`performance_stats.txt`文件，包含：
														
 
															-1. 详细统计信息（总样本数、检测目标数等）
														
 
															-2. 性能指标（准确率、精确率、召回率等）
														
 
															+程序会在输出目录中生成以下内容：
														
 
															+
														
 
															+- 检测结果图片（带检测框）
														
 
															+- `detection_report.csv`: 检测报告，包含以下信息：
														
 
															+  - 图片路径
														
 
															+  - 检测时间
														
 
															+  - 是否检测到目标
														
 
															+  - 检测框坐标
														
 
															+  - 置信度分数
														
 
															 ## 注意事项
														
 
															 1. 确保模型文件路径正确
														
 
															-2. 确保输入图像格式正确
														
 
															-3. 性能分析前需要将确认的真实目标放入`targets_all_True`目录
														
 
															+2. 如果使用GPU加速，请确保CUDA环境配置正确
														
 
															+3. 批量处理时建议使用相对较小的图片尺寸以提高处理速度
														
 
															+4. 检测报告会自动覆盖同名文件，请注意备份
														
 
															+
														
 
															+## 更新日志
														
 
															+
														
 
															+### 2024-03-29
														
 
															+- 移除Excel报告生成功能
														
 
															+- 优化检测报告生成逻辑
														
 
															+- 修复模型加载和属性访问问题
														
--- a/src/analysis/performance_analyzer.py
+++ b/src/analysis/performance_analyzer.py
@@ -209,7 +209,7 @@ class PerformanceAnalyzer:
 
															 def main():
														
 
															     # 示例使用
														
 
															-    result_dir = r"D:\PythonProject\Model\Output\output_20250328_161223_results"
														
 
															+    result_dir = r"D:\PythonProject\Model\output_20250329_140816_results"
														
 
															     analyzer = PerformanceAnalyzer(result_dir)
														
 
															     # 分析性能
														
--- a/src/core/compare_outputs.py
+++ b/src/core/compare_outputs.py
@@ -0,0 +1,66 @@
 
															+import os
														
 
															+import shutil
														
 
															+from pathlib import Path
														
 
															+import re
														
 
															+
														
 
															+def get_base_filename(filename):
														
 
															+    """获取文件名的基础部分（去除时间戳和序号后缀）"""
														
 
															+    # 匹配形如 _20250414094956928104_0.jpg 的后缀
														
 
															+    pattern = r'(_\d+_\d+\.jpg)$'
														
 
															+    match = re.search(pattern, filename)
														
 
															+    if match:
														
 
															+        # 返回去除后缀的文件名
														
 
															+        return filename[:-len(match.group(1))]
														
 
															+    return filename
														
 
															+
														
 
															+def compare_directories(dir1, dir2, output_dir):
														
 
															+    """比较两个目录中的文件并整理差异"""
														
 
															+    # 创建输出目录
														
 
															+    os.makedirs(output_dir, exist_ok=True)
														
 
															+    
														
 
															+    # 获取两个目录中的所有文件
														
 
															+    dir1_files = set(os.listdir(dir1))
														
 
															+    dir2_files = set(os.listdir(dir2))
														
 
															+    
														
 
															+    # 创建文件名映射
														
 
															+    dir1_base_files = {get_base_filename(f): f for f in dir1_files}
														
 
															+    dir2_base_files = {get_base_filename(f): f for f in dir2_files}
														
 
															+    
														
 
															+    # 找出只在dir1中存在的文件
														
 
															+    only_in_dir1 = set(dir1_base_files.keys()) - set(dir2_base_files.keys())
														
 
															+    # 找出只在dir2中存在的文件
														
 
															+    only_in_dir2 = set(dir2_base_files.keys()) - set(dir1_base_files.keys())
														
 
															+    
														
 
															+    # 创建子目录
														
 
															+    dir1_only_dir = os.path.join(output_dir, "only_in_dir1")
														
 
															+    dir2_only_dir = os.path.join(output_dir, "only_in_dir2")
														
 
															+    os.makedirs(dir1_only_dir, exist_ok=True)
														
 
															+    os.makedirs(dir2_only_dir, exist_ok=True)
														
 
															+    
														
 
															+    # 复制文件
														
 
															+    for base_name in only_in_dir1:
														
 
															+        src_file = os.path.join(dir1, dir1_base_files[base_name])
														
 
															+        dst_file = os.path.join(dir1_only_dir, dir1_base_files[base_name])
														
 
															+        shutil.copy2(src_file, dst_file)
														
 
															+        print(f"复制 {src_file} 到 {dst_file}")
														
 
															+    
														
 
															+    for base_name in only_in_dir2:
														
 
															+        src_file = os.path.join(dir2, dir2_base_files[base_name])
														
 
															+        dst_file = os.path.join(dir2_only_dir, dir2_base_files[base_name])
														
 
															+        shutil.copy2(src_file, dst_file)
														
 
															+        print(f"复制 {src_file} 到 {dst_file}")
														
 
															+    
														
 
															+    # 打印统计信息
														
 
															+    print(f"\n统计信息:")
														
 
															+    print(f"目录1中的文件总数: {len(dir1_files)}")
														
 
															+    print(f"目录2中的文件总数: {len(dir2_files)}")
														
 
															+    print(f"只在目录1中存在的文件数: {len(only_in_dir1)}")
														
 
															+    print(f"只在目录2中存在的文件数: {len(only_in_dir2)}")
														
 
															+    print(f"共同存在的文件数: {len(dir1_files) - len(only_in_dir1)}")
														
 
															+
														
 
															+if __name__ == "__main__":
														
 
															+    dir1 = r"D:\PythonProject\Model\output_20250329_140816_results"
														
 
															+    dir2 = r"D:\PythonProject\Model\Output\output_20250329_140816_results"
														
 
															+    output_dir = r"D:\PythonProject\Model\output_differences"
														
 
															+    
														
 
															+    compare_directories(dir1, dir2, output_dir) 
														
--- a/src/core/detect.py
+++ b/src/core/detect.py
--- a/src/core/infer.py
+++ b/src/core/infer.py
@@ -0,0 +1,168 @@
 
															+import os
														
 
															+import cv2
														
 
															+import numpy as np
														
 
															+import onnxruntime
														
 
															+from typing import List, Dict, Optional
														
 
															+from datetime import datetime
														
 
															+import argparse
														
 
															+from tqdm import tqdm
														
 
															+
														
 
															+class UAVDetector:
														
 
															+    def __init__(self, model_path: str, prob_threshold: float = 0.5, max_bbox_ratio: float = 0.05):
														
 
															+        # 初始化ONNX会话
														
 
															+        so = onnxruntime.SessionOptions()
														
 
															+        so.log_severity_level = 3
														
 
															+        self.session = onnxruntime.InferenceSession(
														
 
															+            model_path, 
														
 
															+            so,
														
 
															+            providers=['CUDAExecutionProvider', 'CPUExecutionProvider']
														
 
															+        )
														
 
															+        
														
 
															+        # 模型参数设置
														
 
															+        self.input_size = (640, 640)  # width, height
														
 
															+        self.mean_ = np.array([0.485, 0.456, 0.406], dtype=np.float32)
														
 
															+        self.std_ = np.array([0.229, 0.224, 0.225], dtype=np.float32)
														
 
															+        self.confThreshold = prob_threshold
														
 
															+        self.max_bbox_ratio = max_bbox_ratio
														
 
															+        
														
 
															+        # 获取输入输出名称
														
 
															+        self.input_name = self.session.get_inputs()[0].name
														
 
															+        self.output_name = self.session.get_outputs()[0].name
														
 
															+
														
 
															+    def preprocess(self, srcimg: np.ndarray) -> tuple:
														
 
															+        """图像预处理"""
														
 
															+        img = cv2.cvtColor(srcimg, cv2.COLOR_BGR2RGB)
														
 
															+        img = cv2.resize(img, self.input_size, interpolation=cv2.INTER_LINEAR)
														
 
															+        img = img.astype(np.float32)
														
 
															+        img = img / 255.
														
 
															+        img -= self.mean_[None, None, :]
														
 
															+        img /= self.std_[None, None, :]
														
 
															+        img = np.transpose(img, [2, 0, 1])
														
 
															+        scale_factor = np.array([1., 1.], dtype=np.float32)
														
 
															+        return img, scale_factor
														
 
															+
														
 
															+    def nms(self, boxes: np.ndarray, scores: np.ndarray, conf_threshold: float, iou_threshold: float) -> List[int]:
														
 
															+        """非极大值抑制"""
														
 
															+        x1 = boxes[:, 0]
														
 
															+        y1 = boxes[:, 1]
														
 
															+        x2 = boxes[:, 2]
														
 
															+        y2 = boxes[:, 3]
														
 
															+        areas = (x2 - x1 + 1) * (y2 - y1 + 1)
														
 
															+        order = scores.argsort()[0][::-1]
														
 
															+        keep = []
														
 
															+        
														
 
															+        while order.size > 0:
														
 
															+            i = order[0]
														
 
															+            keep.append(i)
														
 
															+            xx1 = np.maximum(x1[i], x1[order[1:]])
														
 
															+            yy1 = np.maximum(y1[i], y1[order[1:]])
														
 
															+            xx2 = np.minimum(x2[i], x2[order[1:]])
														
 
															+            yy2 = np.minimum(y2[i], y2[order[1:]])
														
 
															+            w = np.maximum(0.0, xx2 - xx1 + 1)
														
 
															+            h = np.maximum(0.0, yy2 - yy1 + 1)
														
 
															+            inter = w * h
														
 
															+            ovr = inter / (areas[i] + areas[order[1:]] - inter)
														
 
															+            inds = np.where(ovr <= iou_threshold)[0]
														
 
															+            order = order[inds + 1]
														
 
															+        return keep
														
 
															+
														
 
															+    def detect(self, srcimg: np.ndarray) -> tuple:
														
 
															+        """执行检测"""
														
 
															+        # 预处理
														
 
															+        img, scale_factor = self.preprocess(srcimg)
														
 
															+        inputs = {'image': img[None, :, :, :], 'scale_factor': scale_factor[None, :]}
														
 
															+        ort_inputs = {i.name: inputs[i.name] for i in self.session.get_inputs() if i.name in inputs}
														
 
															+        
														
 
															+        # 推理
														
 
															+        output = self.session.run(None, ort_inputs)
														
 
															+        bbox, confidence = output
														
 
															+        
														
 
															+        # 过滤低置信度检测
														
 
															+        keep_idx = (confidence[:, 0] > self.confThreshold)
														
 
															+        bbox = bbox[keep_idx, :]
														
 
															+        confidence = confidence[:, keep_idx]
														
 
															+
														
 
															+        # 坐标转换
														
 
															+        ratioh = srcimg.shape[0] / self.input_size[1]
														
 
															+        ratiow = srcimg.shape[1] / self.input_size[0]
														
 
															+        bbox[:, 0] *= ratiow
														
 
															+        bbox[:, 1] *= ratioh
														
 
															+        bbox[:, 2] *= ratiow
														
 
															+        bbox[:, 3] *= ratioh
														
 
															+
														
 
															+        # NMS处理
														
 
															+        keep = self.nms(bbox, confidence, self.confThreshold, 0.4)
														
 
															+
														
 
															+        # 后处理
														
 
															+        outres = []
														
 
															+        img_out = srcimg.copy()
														
 
															+        for idx in keep:
														
 
															+            xmin, ymin, xmax, ymax = bbox[idx].astype(int)
														
 
															+            
														
 
															+            # 检查检测框面积比例
														
 
															+            bbox_area = (xmax - xmin) * (ymax - ymin)
														
 
															+            image_area = srcimg.shape[0] * srcimg.shape[1]
														
 
															+            if bbox_area / image_area > self.max_bbox_ratio:
														
 
															+                continue
														
 
															+                
														
 
															+            score = confidence[0][idx]
														
 
															+            outres.append([xmin, ymin, xmax, ymax, score])
														
 
															+            
														
 
															+            # 绘制检测框和标签
														
 
															+            cv2.rectangle(img_out, (xmin, ymin), (xmax, ymax), (0, 0, 255), thickness=2)
														
 
															+            cv2.putText(img_out, f"UAV: {score:.2f}", (xmin, ymin - 10),
														
 
															+                        cv2.FONT_HERSHEY_SIMPLEX, 0.4, (0, 255, 0), thickness=1)
														
 
															+            
														
 
															+        return img_out, outres
														
 
															+
														
 
															+def process_image(detector: UAVDetector, image_path: str, output_dir: str) -> int:
														
 
															+    """处理单张图像"""
														
 
															+    srcimg = cv2.imread(image_path)
														
 
															+    if srcimg is None:
														
 
															+        print(f"无法读取图像: {image_path}")
														
 
															+        return 0
														
 
															+        
														
 
															+    processed_img, detections = detector.detect(srcimg)
														
 
															+    
														
 
															+    # 保存结果
														
 
															+    if detections or args.save_empty:
														
 
															+        filename = os.path.basename(image_path)
														
 
															+        output_path = os.path.join(output_dir, filename)
														
 
															+        cv2.imwrite(output_path, processed_img)
														
 
															+        
														
 
															+    return len(detections)
														
 
															+
														
 
															+if __name__ == '__main__':
														
 
															+    parser = argparse.ArgumentParser(description='UAV Detection using ONNX model')
														
 
															+    parser.add_argument('--model', type=str, required=True, help='ONNX模型路径')
														
 
															+    parser.add_argument('--input', type=str, required=True, help='输入图像路径或目录')
														
 
															+    parser.add_argument('--output', type=str, default='output', help='输出目录')
														
 
															+    parser.add_argument('--threshold', type=float, default=0.5, help='检测置信度阈值')
														
 
															+    parser.add_argument('--max-bbox-ratio', type=float, default=0.05, help='检测框最大面积比例阈值')
														
 
															+    parser.add_argument('--save-empty', action='store_true', help='是否保存未检测到目标的图片')
														
 
															+    args = parser.parse_args()
														
 
															+
														
 
															+    # 创建输出目录
														
 
															+    os.makedirs(args.output, exist_ok=True)
														
 
															+
														
 
															+    # 初始化检测器
														
 
															+    detector = UAVDetector(
														
 
															+        model_path=args.model,
														
 
															+        prob_threshold=args.threshold,
														
 
															+        max_bbox_ratio=args.max_bbox_ratio
														
 
															+    )
														
 
															+
														
 
															+    # 处理输入
														
 
															+    if os.path.isdir(args.input):
														
 
															+        total_detections = 0
														
 
															+        image_files = []
														
 
															+        for root, _, files in os.walk(args.input):
														
 
															+            image_files.extend([os.path.join(root, f) for f in files if f.lower().endswith(('.jpg', '.png'))])
														
 
															+            
														
 
															+        for img_file in tqdm(image_files, desc='Processing images'):
														
 
															+            total_detections += process_image(detector, img_file, args.output)
														
 
															+            
														
 
															+        print(f'批量处理完成！共检测到 {total_detections} 个目标')
														
 
															+    else:
														
 
															+        detections = process_image(detector, args.input, args.output)
														
 
															+        print(f'处理完成！检测到 {detections} 个目标') 
														
--- a/src/core/inference.py
+++ b/src/core/inference.py
@@ -20,30 +20,34 @@ class ONNXDetector:
 
															         folder_path = filedialog.askdirectory(title='选择输入目录')
														
 
															         return folder_path if folder_path else None
														
 
															-    def __init__(self, model_path: str = 'D:\PythonProject\Model\Data\models\250411_Anti_UAV.onnx', threshold: float = 0.5, 
														
 
															+    def __init__(self, model_path: str = 'D:/PythonProject/Model/Data/models/250411_Anti_UAV.onnx', threshold: float = 0.5, 
														
 
															                  output_dir: str = "None", save_empty: bool = False, 
														
 
															-                 max_bbox_ratio: float = 0.5,  # 已有该参数
														
 
															+                 max_bbox_ratio: float = 0.5,
														
 
															                  input_dir: str = "None"):
														
 
															         self.image_count = 0
														
 
															         self.detection_records = []
														
 
															         self.model_path = model_path
														
 
															         self.input_dir = input_dir
														
 
															+        self.save_empty = save_empty
														
 
															+        self.threshold = threshold
														
 
															+        self.confThreshold = threshold
														
 
															         # 初始化ONNX会话
														
 
															+        so = ort.SessionOptions()
														
 
															+        so.log_severity_level = 3
														
 
															         self.providers = ['CUDAExecutionProvider', 'CPUExecutionProvider']
														
 
															-        self.session = ort.InferenceSession(model_path, providers=self.providers)
														
 
															+        self.session = ort.InferenceSession(model_path, so, providers=self.providers)
														
 
															-        # 获取模型输入尺寸
														
 
															-        input_dims = self.session.get_inputs()[0].shape
														
 
															-        self.input_shape = tuple([dim if isinstance(dim, int) else 1 for dim in input_dims])
														
 
															+        # 模型参数设置
														
 
															+        self.input_size = (640, 640)  # width, height
														
 
															+        self.mean_ = np.array([0.485, 0.456, 0.406], dtype=np.float32)
														
 
															+        self.std_ = np.array([0.229, 0.224, 0.225], dtype=np.float32)
														
 
															+        self.max_bbox_ratio = max_bbox_ratio
														
 
															         # 从模型路径解析版本号
														
 
															-        self.model_version = model_path.split('-')[-1].split('.')[0] if '-' in model_path else '1.0'
														
 
															-        self.input_size = f"{self.input_shape[2]}x{self.input_shape[3]}"
														
 
															+        self.model_version = os.path.basename(model_path).split('.')[0]
														
 
															-        self.threshold = threshold
														
 
															-        self.max_bbox_ratio = max_bbox_ratio  # 已有该赋值
														
 
															-        self.save_empty = save_empty
														
 
															+        # 获取输入输出名称
														
 
															         self.input_name = self.session.get_inputs()[0].name
														
 
															         self.output_name = self.session.get_outputs()[0].name
														
@@ -82,7 +86,7 @@ class ONNXDetector:
 
															                 return None
														
 
															             # GPU预处理流水线
														
 
															-            gpu_resized = cv2.cuda.resize(self.gpu_frame, (self.input_shape[3], self.input_shape[2]))
														
 
															+            gpu_resized = cv2.cuda.resize(self.gpu_frame, self.input_size)
														
 
															             gpu_rgb = cv2.cuda.cvtColor(gpu_resized, cv2.COLOR_BGR2RGB)
														
 
															             # 下载到CPU进行后续处理
														
@@ -96,14 +100,41 @@ class ONNXDetector:
 
															                 return None
														
 
															             self.orig_h, self.orig_w = image_orig.shape[:2]
														
 
															-            image_orig = cv2.resize(image_orig, (self.input_shape[3], self.input_shape[2]))
														
 
															+            image_orig = cv2.resize(image_orig, self.input_size)
														
 
															             image_orig = cv2.cvtColor(image_orig, cv2.COLOR_BGR2RGB)
														
 
															         # 统一的后处理
														
 
															         image = image_orig.astype(np.float32) / 255.0
														
 
															+        image -= self.mean_[None, None, :]
														
 
															+        image /= self.std_[None, None, :]
														
 
															         image = np.transpose(image, (2, 0, 1))  # CHW 格式
														
 
															         return np.expand_dims(image, axis=0)
														
 
															+    def nms(self, boxes: np.ndarray, scores: np.ndarray, conf_threshold: float, iou_threshold: float) -> List[int]:
														
 
															+        """非极大值抑制"""
														
 
															+        x1 = boxes[:, 0]
														
 
															+        y1 = boxes[:, 1]
														
 
															+        x2 = boxes[:, 2]
														
 
															+        y2 = boxes[:, 3]
														
 
															+        areas = (x2 - x1 + 1) * (y2 - y1 + 1)
														
 
															+        order = scores.argsort()[0][::-1]
														
 
															+        keep = []
														
 
															+        
														
 
															+        while order.size > 0:
														
 
															+            i = order[0]
														
 
															+            keep.append(i)
														
 
															+            xx1 = np.maximum(x1[i], x1[order[1:]])
														
 
															+            yy1 = np.maximum(y1[i], y1[order[1:]])
														
 
															+            xx2 = np.minimum(x2[i], x2[order[1:]])
														
 
															+            yy2 = np.minimum(y2[i], y2[order[1:]])
														
 
															+            w = np.maximum(0.0, xx2 - xx1 + 1)
														
 
															+            h = np.maximum(0.0, yy2 - yy1 + 1)
														
 
															+            inter = w * h
														
 
															+            ovr = inter / (areas[i] + areas[order[1:]] - inter)
														
 
															+            inds = np.where(ovr <= iou_threshold)[0]
														
 
															+            order = order[inds + 1]
														
 
															+        return keep
														
 
															+
														
 
															     def inference(self, input_data: np.ndarray) -> np.ndarray:
														
 
															         """执行模型推理"""
														
 
															         scale_factor = np.array([[1, 1]], dtype=np.float32)
														
@@ -149,22 +180,32 @@ class ONNXDetector:
 
															                 return True
														
 
															         return False
														
 
															-    def postprocess(self, detections: np.ndarray, image_orig: np.ndarray, image_path: str) -> int:
														
 
															+    def postprocess(self, detections: np.ndarray, image_orig: np.ndarray, image_path: str) -> tuple:
														
 
															         """后处理检测结果"""
														
 
															         valid_detections = 0
														
 
															         img_out = image_orig.copy()
														
 
															         detections_list = []
														
 
															-        for det in detections:
														
 
															-            class_id = int(det[0])
														
 
															-            confidence = det[1]
														
 
															+        # 过滤低置信度检测
														
 
															+        keep_idx = (detections[:, 1] > self.confThreshold)
														
 
															+        detections = detections[keep_idx]
														
 
															+        
														
 
															+        if len(detections) == 0:
														
 
															+            return 0, img_out, []
														
 
															-            if confidence < self.threshold:
														
 
															-                continue
														
 
															+        # 坐标转换
														
 
															+        ratioh = self.orig_h / self.input_size[1]
														
 
															+        ratiow = self.orig_w / self.input_size[0]
														
 
															+        detections[:, 2:6] *= np.array([ratiow, ratioh, ratiow, ratioh])
														
 
															+        
														
 
															+        # NMS处理
														
 
															+        keep = self.nms(detections[:, 2:6], detections[:, 1:2], self.confThreshold, 0.4)
														
 
															+        
														
 
															+        for idx in keep:
														
 
															+            class_id = int(detections[idx, 0])
														
 
															+            confidence = detections[idx, 1]
														
 
															+            x1, y1, x2, y2 = detections[idx, 2:6].astype(int)
														
 
															-            # 坐标转换和边界检查
														
 
															-            x1, y1, x2, y2 = self._convert_coordinates(det[2:6])
														
 
															-
														
 
															             # 计算检测框面积比例
														
 
															             bbox_area = (x2 - x1) * (y2 - y1)
														
 
															             image_area = self.orig_w * self.orig_h
														
@@ -194,28 +235,12 @@ class ONNXDetector:
 
															                 'class_id': class_id,
														
 
															                 'confidence': float(confidence),
														
 
															                 'bbox': [x1, y1, x2, y2],
														
 
															-            'orig_w': self.orig_w,
														
 
															-            'orig_h': self.orig_h
														
 
															+                'orig_w': self.orig_w,
														
 
															+                'orig_h': self.orig_h
														
 
															             })
														
 
															         return valid_detections, img_out, detections_list
														
 
															-    def _convert_coordinates(self, coords: List[float]) -> tuple:
														
 
															-        """将模型输出坐标转换为原始图像尺寸"""
														
 
															-        x1 = int(coords[0] * self.orig_w / self.input_shape[3])
														
 
															-        y1 = int(coords[1] * self.orig_h / self.input_shape[2])
														
 
															-        x2 = int(coords[2] * self.orig_w / self.input_shape[3])
														
 
															-        y2 = int(coords[3] * self.orig_h / self.input_shape[2])
														
 
															-        
														
 
															-        # 边界检查
														
 
															-        clamp = lambda val, max_val: max(0, min(val, max_val - 1))
														
 
															-        return (
														
 
															-            clamp(x1, self.orig_w),
														
 
															-            clamp(y1, self.orig_h),
														
 
															-            clamp(x2, self.orig_w),
														
 
															-            clamp(y2, self.orig_h)
														
 
															-        )
														
 
															-
														
 
															     def process_image(self, image_path: str) -> int:
														
 
															         """端到端处理单张图像"""
														
 
															         input_data = self.preprocess(image_path)
														
@@ -257,8 +282,6 @@ if __name__ == '__main__':
 
															     parser.add_argument('--output', type=str, default=None, help='输出目录路径，默认为输入目录名+_results')
														
 
															     parser.add_argument('--max-bbox-ratio', type=float, default=0.05,
														
 
															                       help='检测框最大面积比例阈值，默认0.05')
														
 
															-    parser.add_argument('--report', type=str, choices=['csv', 'excel', 'all'], default='all',
														
 
															-                      help='输出报告格式: csv|excel|all')
														
 
															     parser.add_argument('--save-empty', action='store_true',
														
 
															                       help='是否保存未检测到目标的图片')
														
 
															     parser.add_argument('--gui', action='store_true',
														
@@ -282,7 +305,7 @@ if __name__ == '__main__':
 
															     # 初始化检测器时传递参数
														
 
															     detector = ONNXDetector(
														
 
															         threshold=args.threshold,
														
 
															-        max_bbox_ratio=args.max_bbox_ratio,  # 添加该参数传递
														
 
															+        max_bbox_ratio=args.max_bbox_ratio,
														
 
															         output_dir=args.output,
														
 
															         save_empty=args.save_empty,
														
 
															         input_dir=args.input if os.path.isdir(args.input) else None
														
@@ -301,14 +324,9 @@ if __name__ == '__main__':
 
															             total += detector.process_image(img_file)
														
 
															         print(f'批量处理完成！共检测到 {total} 个目标')
														
 
															-    # 生成检测报告
														
 
															-    if args.report in ('csv', 'all'):
														
 
															+        # 生成CSV报告
														
 
															         csv_path = os.path.join(detector.output_dir, 'detection_report.csv')
														
 
															         ReportGenerator(detector).generate_csv(csv_path)
														
 
															         print(f'CSV报告已生成: {csv_path}')
														
 
															-    if args.report in ('excel', 'all'):
														
 
															-        excel_path = os.path.join(detector.output_dir, 'detection_report.xlsx')
														
 
															-        ReportGenerator(detector).generate_excel(excel_path)
														
 
															-        print(f'Excel报告已生成: {excel_path}')
														
 
															     else:
														
 
															         detections = detector.process_image(args.input)