增加说明

增加联邦学习评价指标。bugfix: 修复训练模型参数聚合问题
训练模型配置
2025-05-10 17:23:06 +08:00 · 2025-05-10 17:22:56 +08:00 · 2025-05-10 16:19:00 +08:00 · 2025-05-10 16:18:37 +08:00 · 2025-05-07 10:41:36 +08:00 · 2025-05-07 10:41:06 +08:00
32 changed files with 944 additions and 3 deletions
--- a/.gitignore
+++ b/.gitignore
@@ -178,7 +178,7 @@ cython_debug/
 # ---> JetBrains
 # Covers JetBrains IDEs: IntelliJ, RubyMine, PhpStorm, AppCode, PyCharm, CLion, Android Studio, WebStorm and Rider
 # Reference: https://intellij-support.jetbrains.com/hc/en-us/articles/206544839
-
+.idea/
 # User-specific stuff
 .idea/**/workspace.xml
 .idea/**/tasks.xml
@@ -277,6 +277,7 @@ fabric.properties
 # Icon must end with two \r
 Icon

+
 # Thumbnails
 ._*

@@ -296,3 +297,10 @@ Network Trash Folder
 Temporary Items
 .apdisk

+# project files
+/whl_packages/
+runs/
+*.pt
+*.cache
+.vscode/
+*.json
--- a/README.md
+++ b/README.md
@@ -1,3 +1,35 @@
 # Graduation-Project

 毕业设计：基于YOLO和图像融合技术的无人机检测系统及安全性研究
+
+Linux 运行联邦训练
+```bash
+cd federated_learning
+```
+
+```bash
+nohup python -u yolov8_fed.py > runtime.log 2>&1 &
+```
+
+Linux 运行集中训练
+```bash
+cd yolov8
+```
+
+```bash
+nohup python -u yolov8_train.py > runtime.log 2>&1 &
+```
+
+实时监控日志文件
+```bash
+tail -f runtime.log
+```
+
+运行图像融合配准代码
+```bash
+cd image_fusion
+```
+
+```bash
+python Image_Registration_test.py
+```
--- a/dataset/train1/images/6.jpg
+++ b/dataset/train1/images/6.jpg
--- a/dataset/train1/images/7.jpg
+++ b/dataset/train1/images/7.jpg
--- a/dataset/train1/labels/6.txt
+++ b/dataset/train1/labels/6.txt
@@ -0,0 +1,2 @@
+0 0.5375 0.37395833333333334 0.253125 0.16458333333333333
+0 0.2890625 0.5833333333333334 0.196875 0.1125
--- a/dataset/train1/labels/7.txt
+++ b/dataset/train1/labels/7.txt
@@ -0,0 +1 @@
+0 0.36328125 0.525 0.7109375 0.8083333333333333
--- a/dataset/train1/train1.yaml
+++ b/dataset/train1/train1.yaml
@@ -0,0 +1,4 @@
+train: ./images
+val:   ../val
+nc:    1
+names: ['uav']
--- a/dataset/train2/images/000007.JPG
+++ b/dataset/train2/images/000007.JPG
--- a/dataset/train2/images/02.jpg
+++ b/dataset/train2/images/02.jpg
--- a/dataset/train2/labels/000007.txt
+++ b/dataset/train2/labels/000007.txt
@@ -0,0 +1 @@
+0 0.6934895833333333 0.6527777777777778 0.008854166666666666 0.018518518518518517
--- a/dataset/train2/labels/02.txt
+++ b/dataset/train2/labels/02.txt
@@ -0,0 +1 @@
+0 0.423698 0.593519 0.061979 0.029630
--- a/dataset/train2/train2.yaml
+++ b/dataset/train2/train2.yaml
@@ -0,0 +1,4 @@
+train: ./images
+val:   ../val
+nc:    1
+names: ['uav']
--- a/dataset/val/images/VS_P65.jpg
+++ b/dataset/val/images/VS_P65.jpg
--- a/dataset/val/images/VS_P66.jpg
+++ b/dataset/val/images/VS_P66.jpg
--- a/dataset/val/labels/VS_P65.txt
+++ b/dataset/val/labels/VS_P65.txt
@@ -0,0 +1 @@
+0 0.5109375 0.5322916666666667 0.125 0.13958333333333334
--- a/dataset/val/labels/VS_P66.txt
+++ b/dataset/val/labels/VS_P66.txt
@@ -0,0 +1 @@
+0 0.55078125 0.296875 0.0890625 0.08958333333333333
--- a/federated_learning/GenerateTestdata.sh
+++ b/federated_learning/GenerateTestdata.sh
@@ -0,0 +1,16 @@
+# 创建测试目录结构
+mkdir -p ./test_data/{client1,client2}/{train,val}/images
+mkdir -p ./test_data/{client1,client2}/{train,val}/labels
+
+# 生成虚拟数据（各客户端仅需2张图片）
+for client in client1 client2; do
+  for split in train val; do
+    # 创建空图片（128x128 RGB）
+    magick -size 128x128 xc:white test_data/${client}/${split}/images/img1.jpg
+    magick -size 128x128 xc:black test_data/${client}/${split}/images/img2.jpg
+
+    # 创建示例标签文件
+    echo "0 0.5 0.5 0.2 0.2" > test_data/${client}/${split}/labels/img1.txt
+    echo "1 0.3 0.3 0.4 0.4" > test_data/${client}/${split}/labels/img2.txt
+  done
+done
--- a/federated_learning/init.py
+++ b/federated_learning/init.py
--- a/federated_learning/config/client1_data.yaml
+++ b/federated_learning/config/client1_data.yaml
@@ -0,0 +1,4 @@
+train: ../test_data/client1/train/images
+val: ../test_data/client1/val/images
+nc: 2
+names: [ 'class0', 'class1' ]
--- a/federated_learning/config/client2_data.yaml
+++ b/federated_learning/config/client2_data.yaml
@@ -0,0 +1,4 @@
+train: ../test_data/client2/train/images
+val: ../test_data/client2/val/images
+nc: 2
+names: [ 'class0', 'class1' ]
--- a/federated_learning/yolo11n.pt
+++ b/federated_learning/yolo11n.pt
--- a/federated_learning/yolov8.yaml
+++ b/federated_learning/yolov8.yaml
@@ -0,0 +1,49 @@
+# Ultralytics 🚀 AGPL-3.0 License - https://ultralytics.com/license
+
+# Ultralytics YOLOv8 object detection model with P3/8 - P5/32 outputs
+# Model docs: https://docs.ultralytics.com/models/yolov8
+# Task docs: https://docs.ultralytics.com/tasks/detect
+
+# Parameters
+nc: 1 # number of classes
+scales: # model compound scaling constants, i.e. 'model=yolov8n.yaml' will call yolov8.yaml with scale 'n'
+  # [depth, width, max_channels]
+  n: [0.33, 0.25, 1024] # YOLOv8n summary: 129 layers, 3157200 parameters, 3157184 gradients, 8.9 GFLOPS
+  s: [0.33, 0.50, 1024] # YOLOv8s summary: 129 layers, 11166560 parameters, 11166544 gradients, 28.8 GFLOPS
+  m: [0.67, 0.75, 768] # YOLOv8m summary: 169 layers, 25902640 parameters, 25902624 gradients, 79.3 GFLOPS
+  l: [1.00, 1.00, 512] # YOLOv8l summary: 209 layers, 43691520 parameters, 43691504 gradients, 165.7 GFLOPS
+  x: [1.00, 1.25, 512] # YOLOv8x summary: 209 layers, 68229648 parameters, 68229632 gradients, 258.5 GFLOPS
+
+# YOLOv8.0n backbone
+backbone:
+  # [from, repeats, module, args]
+  - [-1, 1, Conv, [64, 3, 2]] # 0-P1/2
+  - [-1, 1, Conv, [128, 3, 2]] # 1-P2/4
+  - [-1, 3, C2f, [128, True]]
+  - [-1, 1, Conv, [256, 3, 2]] # 3-P3/8
+  - [-1, 6, C2f, [256, True]]
+  - [-1, 1, Conv, [512, 3, 2]] # 5-P4/16
+  - [-1, 6, C2f, [512, True]]
+  - [-1, 1, Conv, [1024, 3, 2]] # 7-P5/32
+  - [-1, 3, C2f, [1024, True]]
+  - [-1, 1, SPPF, [1024, 5]] # 9
+
+# YOLOv8.0n head
+head:
+  - [-1, 1, nn.Upsample, [None, 2, "nearest"]]
+  - [[-1, 6], 1, Concat, [1]] # cat backbone P4
+  - [-1, 3, C2f, [512]] # 12
+
+  - [-1, 1, nn.Upsample, [None, 2, "nearest"]]
+  - [[-1, 4], 1, Concat, [1]] # cat backbone P3
+  - [-1, 3, C2f, [256]] # 15 (P3/8-small)
+
+  - [-1, 1, Conv, [256, 3, 2]]
+  - [[-1, 12], 1, Concat, [1]] # cat head P4
+  - [-1, 3, C2f, [512]] # 18 (P4/16-medium)
+
+  - [-1, 1, Conv, [512, 3, 2]]
+  - [[-1, 9], 1, Concat, [1]] # cat head P5
+  - [-1, 3, C2f, [1024]] # 21 (P5/32-large)
+
+  - [[15, 18, 21], 1, Detect, [nc]] # Detect(P3, P4, P5)
--- a/federated_learning/yolov8_fed.py
+++ b/federated_learning/yolov8_fed.py
@@ -0,0 +1,252 @@
+import glob
+import os
+from pathlib import Path
+import json
+from pydoc import cli
+from threading import local
+
+import yaml
+from ultralytics import YOLO
+import copy
+import torch
+
+
+# ------------ 新增联邦学习工具函数 ------------
+def federated_avg(global_model, client_weights):
+    """联邦平均核心算法"""
+    # 计算总样本数
+    total_samples = sum(n for _, n in client_weights)
+    if total_samples == 0:
+        raise ValueError("Total number of samples must be positive.")
+
+    # DEBUG: global_dict
+    # print(global_model)
+
+    # 获取YOLO底层PyTorch模型参数
+    global_dict = global_model.model.state_dict()
+    # 提取所有客户端的 state_dict 和对应样本数
+    state_dicts, sample_counts = zip(*client_weights)
+
+    # 克隆参数并脱离计算图
+    global_dict_copy = {
+        k: v.clone().detach().requires_grad_(False) for k, v in global_dict.items()
+    }
+
+    # 聚合可训练且存在的参数
+    for key in global_dict_copy:
+        # if global_dict_copy[key].dtype != torch.float32:
+        #     continue
+        # if any(
+        #     x in key for x in ["running_mean", "running_var", "num_batches_tracked"]
+        # ):
+        #     continue
+        # 检查所有客户端是否包含当前键
+        all_clients_have_key = all(key in sd for sd in state_dicts)
+        if all_clients_have_key:
+            # 计算每个客户端的加权张量
+            # weighted_tensors = [
+            #     client_state[key].float() * (sample_count / total_samples)
+            #     for client_state, sample_count in zip(state_dicts, sample_counts)
+            # ]
+            weighted_tensors = []
+            for client_state, sample_count in zip(state_dicts, sample_counts):
+                weight = sample_count / total_samples  # 计算权重
+                weighted_tensor = client_state[key].float() * weight  # 加权张量
+                weighted_tensors.append(weighted_tensor)
+            # 聚合加权张量并更新全局参数
+            global_dict_copy[key] = torch.stack(weighted_tensors, dim=0).sum(dim=0)
+
+        # else:
+        #     print(f"错误: 键 {key} 在部分客户端缺失，已保留全局参数")
+        # 终止训练或记录日志
+        # raise KeyError(f"键 {key} 缺失")
+
+    # 加载回YOLO模型
+    global_model.model.load_state_dict(global_dict_copy, strict=True)
+
+    # global_model.model.train()
+    # with torch.no_grad():
+    #     global_model.model.load_state_dict(global_dict_copy, strict=True)
+
+    # 定义多个关键层
+    MONITOR_KEYS = [
+        "model.0.conv.weight",
+        "model.1.conv.weight",
+        "model.3.conv.weight",
+        "model.5.conv.weight",
+        "model.7.conv.weight",
+        "model.9.cv1.conv.weight",
+        "model.12.cv1.conv.weight",
+        "model.15.cv1.conv.weight",
+        "model.18.cv1.conv.weight",
+        "model.21.cv1.conv.weight",
+        "model.22.dfl.conv.weight",
+    ]
+
+    with open("aggregation_check.txt", "a") as f:
+        f.write("\n=== 参数聚合检查 ===\n")
+    for key in MONITOR_KEYS:
+        # if key not in global_dict:
+        #     continue
+        # if not all(key in sd for sd in state_dicts):
+        #     continue
+
+        # 计算聚合后均值
+        aggregated_mean = global_dict[key].mean().item()
+
+        # 计算各客户端均值
+        client_means = [sd[key].float().mean().item() for sd in state_dicts]
+        with open("aggregation_check.txt", "a") as f:
+            f.write(f"层 '{key}' 聚合后均值: {aggregated_mean:.6f}\n")
+            f.write(f"各客户端该层均值差异: {[f'{cm:.6f}' for cm in client_means]}\n")
+            f.write(f"客户端最大差异: {max(client_means) - min(client_means):.6f}\n\n")
+
+    return global_model
+
+
+# ------------ 修改训练流程 ------------
+def federated_train(num_rounds, clients_data):
+    # ========== 初始化指标记录 ==========
+    metrics = {
+        "round": [],
+        "val_mAP": [],  # 每轮验证集mAP
+        # "train_loss": [],  # 每轮平均训练损失
+        "client_mAPs": [],  # 各客户端本地模型在验证集上的mAP
+        "communication_cost": [],  # 每轮通信开销（MB）
+    }
+    # 初始化全局模型
+    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+    global_model = (
+        YOLO("/home/image1325/DATA/Graduation-Project/federated_learning/yolov8n.yaml")
+        .load("/home/image1325/DATA/Graduation-Project/federated_learning/yolov8n.pt")
+        .to(device)
+    )
+    global_model.model.model[-1].nc = 1  # 设置检测类别数为1
+    # global_model.model.train.ema.enabled = False
+
+    # 克隆全局模型
+    local_model = copy.deepcopy(global_model)
+
+    for _ in range(num_rounds):
+        client_weights = []
+        # 各客户端的训练损失
+        # client_losses = []
+
+        # DEBUG: 检查全局模型参数
+        # global_dict = global_model.model.state_dict()
+        # print(global_dict.keys())
+
+        # 每个客户端本地训练
+        for data_path in clients_data:
+            # 统计本地训练样本数
+            with open(data_path, "r") as f:
+                config = yaml.safe_load(f)
+            #  Resolve img_dir relative to the YAML file's location
+            yaml_dir = os.path.dirname(data_path)
+            img_dir = os.path.join(
+                yaml_dir, config.get("train", data_path)
+            )  # 从配置文件中获取图像目录
+
+            # print(f"Image directory: {img_dir}")
+            num_samples = (
+                len(glob.glob(os.path.join(img_dir, "*.jpg")))
+                + len(glob.glob(os.path.join(img_dir, "*.png")))
+                + len(glob.glob(os.path.join(img_dir, "*.jpeg")))
+            )
+            # print(f"Number of images: {num_samples}")
+
+            local_model.model.load_state_dict(
+                global_model.model.state_dict(), strict=True
+            )
+
+            # 本地训练（保持你的原有参数设置）
+            local_model.train(
+                name=f"train{_ + 1}",  # 当前轮次
+                data=data_path,
+                # model=local_model,
+                epochs=16,  # 每轮本地训练多少个epoch
+                # save_period=16,
+                imgsz=768,  # 图像大小
+                verbose=False,  # 关闭冗余输出
+                batch=-1,  # 批大小
+                workers=6,  # 工作线程数
+            )
+
+            # 记录客户端训练损失
+            # client_loss = results.results_dict['train_loss']
+            # client_losses.append(client_loss)
+
+            # 收集模型参数及样本数
+            client_weights.append((local_model.model.state_dict(), num_samples))
+
+        # 聚合参数更新全局模型
+        global_model = federated_avg(global_model, client_weights)
+
+        # DEBUG: 检查全局模型参数
+        # keys = global_model.model.state_dict().keys()
+
+        # ========== 评估全局模型 ==========
+        # 复制全局模型以避免在评估时修改参数
+        val_model = copy.deepcopy(global_model)
+        # 评估全局模型在验证集上的性能
+        with torch.no_grad():
+            val_results = val_model.val(
+                data="/mnt/DATA/uav_dataset_old/UAVdataset/fed_data.yaml",  # 指定验证集配置文件
+                imgsz=768,  # 图像大小
+                batch=16,  # 批大小
+                verbose=False,  # 关闭冗余输出
+            )
+        # 丢弃评估模型
+        del val_model
+
+        # DEBUG: 检查全局模型参数
+        # if keys != global_model.model.state_dict().keys():
+        #     print("模型参数不一致！")
+
+        val_mAP = val_results.box.map  # 获取mAP@0.5
+
+        # 计算平均训练损失
+        # avg_train_loss = sum(client_losses) / len(client_losses)
+
+        # 计算通信开销（假设传输全部模型参数）
+        model_size = sum(p.numel() * 4 for p in global_model.model.parameters()) / (
+            1024**2
+        )  # MB
+
+        # 记录到指标容器
+        metrics["round"].append(_ + 1)
+        metrics["val_mAP"].append(val_mAP)
+        # metrics['train_loss'].append(avg_train_loss)
+        metrics["communication_cost"].append(model_size)
+        # 打印当前轮次结果
+        with open("aggregation_check.txt", "a") as f:
+            f.write(f"\n[Round {_ + 1}/{num_rounds}]\n")
+            f.write(f"Validation mAP@0.5: {val_mAP:.4f}\n")
+            # f.write(f"Average Train Loss: {avg_train_loss:.4f}")
+            f.write(f"Communication Cost: {model_size:.2f} MB\n\n")
+
+    return global_model, metrics
+
+
+if __name__ == "__main__":
+    # 联邦训练配置
+    clients_config = [
+        "/mnt/DATA/uav_fed/train1/train1.yaml",  # 客户端1数据路径
+        "/mnt/DATA/uav_fed/train2/train2.yaml",  # 客户端2数据路径
+    ]
+
+    # 使用本地数据集进行测试
+    # clients_config = [
+    #     "/home/image1325/DATA/Graduation-Project/dataset/train1/train1.yaml",
+    #     "/home/image1325/DATA/Graduation-Project/dataset/train2/train2.yaml",
+    # ]
+
+    # 运行联邦训练
+    final_model, metrics = federated_train(num_rounds=10, clients_data=clients_config)
+
+    # 保存最终模型
+    final_model.save("yolov8n_federated.pt")
+    # final_model.export(format="onnx")  # 导出为ONNX格式
+
+    with open("metrics.json", "w") as f:
+        json.dump(metrics, f, indent=4)
--- a/image_fusion/Image_Registration_test.py
+++ b/image_fusion/Image_Registration_test.py
@@ -0,0 +1,354 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+
+import time
+import argparse
+
+import cv2
+import numpy as np
+
+from ultralytics import YOLO
+from skimage.metrics import structural_similarity as ssim
+
+# Load the YOLO detector once at import time.
+yolo_model = YOLO("best.pt")  # weights file; can be swapped for yolov8s/m/l etc.
+yolo_model.to('cuda')  # run on the GPU; NOTE(review): presumably fails on CPU-only hosts — confirm
+
+
+def calculate_en(img):
+    """计算信息熵（处理灰度图）"""
+    hist = cv2.calcHist([img], [0], None, [256], [0, 256])
+    hist = hist / hist.sum()
+    return -np.sum(hist * np.log2(hist + 1e-10))
+
+
+def calculate_sf(img):
+    """计算空间频率（处理灰度图）"""
+    rf = np.sqrt(np.mean(np.square(np.diff(img, axis=0))))
+    cf = np.sqrt(np.mean(np.square(np.diff(img, axis=1))))
+    return np.sqrt(rf ** 2 + cf ** 2)
+
+
+def calculate_mi(img1, img2):
+    """计算互信息（处理灰度图）"""
+    hist_2d = np.histogram2d(img1.ravel(), img2.ravel(), 256)[0]
+    pxy = hist_2d / hist_2d.sum()
+    px = np.sum(pxy, axis=1)
+    py = np.sum(pxy, axis=0)
+    return np.sum(pxy * np.log2(pxy / (px[:, None] * py[None, :] + 1e-10) + 1e-10))
+
+
+def calculate_ssim(img1, img2):
+    """计算SSIM（处理灰度图）"""
+    return ssim(img1, img2, data_range=255)
+
+
+# 裁剪线性RGB对比度拉伸：（去掉2%百分位以下的数，去掉98%百分位以上的数，上下百分位数一般相同，并设置输出上下限）
+def truncated_linear_stretch(image, truncated_value=2, maxout=255, min_out=0):
+    """
+    :param image:
+    :param truncated_value:
+    :param maxout:
+    :param min_out:
+    :return:
+    """
+    
+    def gray_process(gray, maxout=maxout, minout=min_out):
+        truncated_down = np.percentile(gray, truncated_value)
+        truncated_up = np.percentile(gray, 100 - truncated_value)
+        gray_new = ((maxout - minout) / (truncated_up - truncated_down)) * gray
+        gray_new[gray_new < minout] = minout
+        gray_new[gray_new > maxout] = maxout
+        return np.uint8(gray_new)
+    
+    (b, g, r) = cv2.split(image)
+    b = gray_process(b)
+    g = gray_process(g)
+    r = gray_process(r)
+    result = cv2.merge((b, g, r))  # 合并每一个通道
+    return result
+
+
+# RGB图片配准函数，采用白天的可见光与红外灰度图，计算两者Surf共同特征点，之间的仿射矩阵。
+def Images_matching(img_base, img_target):
+    """
+    :param img_base:
+    :param img_target:匹配图像
+    :return: 返回仿射矩阵
+    """
+    start = time.time()
+    orb = cv2.ORB_create()
+    
+    # 对可见光图像进行对比度拉伸
+    # img_base = truncated_linear_stretch(img_base)
+    
+    img_base = cv2.cvtColor(img_base, cv2.COLOR_BGR2GRAY)
+    sift = cv2.SIFT_create()
+    # 使用sift算子计算特征点和特征点周围的特征向量
+    st1 = time.time()
+    kp1, des1 = sift.detectAndCompute(img_base, None)  # 1136    1136, 64
+    kp2, des2 = sift.detectAndCompute(img_target, None)
+    en1 = time.time()
+    
+    # print(en1 - st1, "特征提取")
+    
+    # 进行KNN特征匹配
+    # FLANN_INDEX_KDTREE = 0  # 建立FLANN匹配器的参数
+    # indexParams = dict(algorithm=FLANN_INDEX_KDTREE, trees=5)  # 配置索引，密度树的数量为5
+    # searchParams = dict(checks=50)  # 指定递归次数
+    # flann = cv2.FlannBasedMatcher(indexParams, searchParams)  # 建立匹配器
+    # matches = flann.knnMatch(des1, des2, k=2)  # 得出匹配的关键点  list: 1136
+    # FLANN_INDEX_KDTREE = 1
+    # index_params = dict(algorithm=FLANN_INDEX_KDTREE, trees=5)
+    # search_params = dict(checks=50)
+    # flann = cv2.FlannBasedMatcher(index_params, search_params)
+    # matches = flann.knnMatch(des1, des2, k=2)
+    
+    st2 = time.time()
+    matcher = cv2.BFMatcher()
+    matches = matcher.knnMatch(des1, des2, k=2)
+    de2 = time.time()
+    # print(de2 - st2, "特征匹配")
+    good = []
+    # 提取优秀的特征点
+    for m, n in matches:
+        if m.distance < 0.75 * n.distance:  # 如果第一个邻近距离比第二个邻近距离的0.7倍小，则保留
+            good.append(m)  # 134
+    src_pts = np.array([kp1[m.queryIdx].pt for m in good])  # 查询图像的特征描述子索引  # 134, 2
+    dst_pts = np.array([kp2[m.trainIdx].pt for m in good])  # 训练(模板)图像的特征描述子索引
+    if len(src_pts) <= 4:
+        print("Not enough matches are found - {}/{}".format(len(good), 4))
+        return 0, None, 0
+    else:
+        print(len(dst_pts), len(src_pts), "配准坐标点")
+        H = cv2.findHomography(dst_pts, src_pts, cv2.RANSAC, 4)  # 生成变换矩阵  H[0]: 3, 3  H[1]: 134, 1
+        end = time.time()
+        times = end - start
+        # print("配准时间", times)
+        return 1, H[0], len(dst_pts)
+
+
+def fusions(img_vl, img_inf):
+    """
+    :param img_vl: 原图像
+    :param img_inf: 红外图像
+    :return:
+    """
+    img_YUV = cv2.cvtColor(img_vl, cv2.COLOR_BGR2YUV)  # 如果输入是BGR，需转换
+    # img_YUV = cv2.cvtColor(img_vl, cv2.COLOR_RGB2YUV)
+    y, u, v = cv2.split(img_YUV)  # 分离通道,获取Y通道
+    Yf = y * 0.5 + img_inf * 0.5
+    Yf = Yf.astype(np.uint8)
+    fusion = cv2.cvtColor(cv2.merge((Yf, u, v)), cv2.COLOR_YUV2RGB)
+    return fusion
+
+
+def removeBlackBorder(gray):
+    """
+    移除缝合后的图像的多余黑边
+    输入：
+        image：三维numpy矩阵，待处理图像
+    输出：
+        裁剪后的图像
+    """
+    threshold = 40  # 阈值
+    nrow = gray.shape[0]  # 获取图片尺寸
+    ncol = gray.shape[1]
+    rowc = gray[:, int(1 / 2 * nrow)]  # 无法区分黑色区域超过一半的情况
+    colc = gray[int(1 / 2 * ncol), :]
+    rowflag = np.argwhere(rowc > threshold)
+    colflag = np.argwhere(colc > threshold)
+    left, bottom, right, top = rowflag[0, 0], colflag[-1, 0], rowflag[-1, 0], colflag[0, 0]
+    # cv2.imshow('name', gray[left:right, top:bottom])  # 效果展示
+    cv2.waitKey(1)
+    return gray[left:right, top:bottom], left, right, top, bottom
+
+
+def main(matchimg_vi, matchimg_in):
+    """
+    :param matchimg_vi: 可见光图像
+    :param matchimg_in: 红外图像
+    :return: 融合好的图像（带检测结果）
+    """
+    try:
+        orimg_vi = matchimg_vi
+        orimg_in = matchimg_in
+        h, w = orimg_vi.shape[:2]  # 480 640
+        # (3, 3)//获取对应的配准坐标点
+        flag, H, dot = Images_matching(matchimg_vi, matchimg_in)
+        if flag == 0:
+            return 0, None, 0, 0.0, 0.0, 0.0, 0.0
+        else:
+            # 配准处理
+            matched_ni = cv2.warpPerspective(orimg_in, H, (w, h))
+            matched_ni, left, right, top, bottom = removeBlackBorder(matched_ni)
+            
+            # 裁剪可见光图像
+            # fusion = fusions(orimg_vi[left:right, top:bottom], matched_ni)
+            
+            # 不裁剪可见光图像
+            fusion = fusions(orimg_vi, matched_ni)
+            
+            # 转换为灰度计算指标
+            fusion_gray = cv2.cvtColor(fusion, cv2.COLOR_RGB2GRAY)
+            cropped_vi_gray = cv2.cvtColor(orimg_vi, cv2.COLOR_BGR2GRAY)
+            matched_ni_gray = matched_ni  # 红外图已经是灰度
+            
+            # 计算指标
+            en = calculate_en(fusion_gray)
+            sf = calculate_sf(fusion_gray)
+            mi_visible = calculate_mi(fusion_gray, cropped_vi_gray)
+            mi_infrared = calculate_mi(fusion_gray, matched_ni_gray)
+            mi_total = mi_visible + mi_infrared
+            
+            # 添加SSIM容错处理
+            try:
+                ssim_visible = calculate_ssim(fusion_gray, cropped_vi_gray)
+                ssim_infrared = calculate_ssim(fusion_gray, matched_ni_gray)
+                ssim_avg = (ssim_visible + ssim_infrared) / 2
+            except Exception as ssim_error:
+                print(f"SSIM计算错误: {ssim_error}")
+                ssim_avg = -1  # 用-1表示计算失败
+            
+            # YOLOv8目标检测
+            results = yolo_model(fusion)  # 输入融合后的图像
+            annotated_image = results[0].plot()  # 绘制检测框
+            
+            # 返回带检测结果的图像
+            return 1, annotated_image, dot, en, sf, mi_total, ssim_avg
+    except Exception as e:
+        print(f"Error in fusion/detection: {e}")
+        return 0, None, 0, 0.0, 0.0, 0.0, 0.0
+
+
+def parse_args():
+    # 输入可见光和红外图像路径
+    visible_image_path = "./test/visible/visibleI0195.jpg"  # 可见光图片路径
+    infrared_image_path = "./test/infrared/infraredI0195.jpg"  # 红外图片路径
+    # 输入可见光和红外视频路径
+    visible_video_path = "./test/visible.mp4"  # 可见光视频路径
+    infrared_video_path = "./test/infrared.mp4"  # 红外视频路径
+    
+    """解析命令行参数"""
+    parser = argparse.ArgumentParser(description='图像融合与目标检测')
+    
+    parser.add_argument('--mode', type=str, choices=['video', 'image'], default='image',
+                        help='输入模式：video（视频流） 或 image（静态图片）')
+    
+    # 区分摄像头或视频文件
+    parser.add_argument('--source', type=str, choices=['camera', 'file'],
+                        help='视频输入类型：camera（摄像头）或 file（视频文件）')
+    
+    # 视频模式参数
+    parser.add_argument('--video1', type=str, default=visible_video_path,
+                        help='可见光视频路径（仅在source=file时需要）')
+    parser.add_argument('--video2', type=str, default=infrared_video_path,
+                        help='红外视频路径（仅在source=file时需要）')
+    
+    # 摄像头模式参数
+    parser.add_argument('--camera_id1', type=int, default=0,
+                        help='可见光摄像头ID（仅在source=camera时需要，默认0）')
+    parser.add_argument('--camera_id2', type=int, default=1,
+                        help='红外摄像头ID（仅在source=camera时需要，默认1）')
+    parser.add_argument('--output', type=str, default='output.mp4',
+                        help='输出视频路径（仅在video模式需要）')
+    
+    # 图片模式参数
+    parser.add_argument('--visible', type=str, default=visible_image_path,
+                        help='可见光图片路径（仅在image模式需要）')
+    parser.add_argument('--infrared', type=str, default=infrared_image_path,
+                        help='红外图片路径（仅在image模式需要）')
+    
+    return parser.parse_args()
+
+
+if __name__ == '__main__':
+    time_all = 0
+    dots = 0
+    i = 0
+    args = parse_args()
+    
+    if args.mode == 'video':
+        if args.source == 'file':
+            # ========== 视频流处理模式 ==========
+            if not args.video1 or not args.video2:
+                raise ValueError("视频模式需要指定 --video1 和 --video2 参数")
+            capture = cv2.VideoCapture(args.video2)
+            capture2 = cv2.VideoCapture(args.video1)
+        elif args.source == 'camera':
+            # ========== 摄像头处理模式 ==========
+            capture = cv2.VideoCapture(args.camera_id1)
+            capture2 = cv2.VideoCapture(args.camera_id2)
+        else:
+            raise ValueError("必须指定 --source 参数（camera 或 file）")
+        
+        # 公共视频处理逻辑
+        fps = capture.get(cv2.CAP_PROP_FPS) if args.source == 'file' else 30
+        fourcc = cv2.VideoWriter_fourcc(*'XVID')
+        out = cv2.VideoWriter(args.output, fourcc, fps, (640, 480))
+        
+        while True:
+            ret1, frame_vi = capture.read()  # 可见光帧
+            ret2, frame_ir = capture2.read()  # 红外帧
+            if not ret1 or not ret2:
+                break
+            
+            # 红外图像转灰度
+            frame_ir_gray = cv2.cvtColor(frame_ir, cv2.COLOR_BGR2GRAY)
+            
+            # 执行融合与检测
+            flag, fusion, _ = main(frame_vi, frame_ir_gray)
+            
+            if flag == 1:
+                cv2.imshow("Fusion with YOLOv8 Detection", fusion)
+                out.write(fusion)
+            
+            if cv2.waitKey(1) == ord('q'):
+                break
+        
+        # 释放资源
+        capture.release()
+        capture2.release()
+        out.release()
+        cv2.destroyAllWindows()
+    
+    elif args.mode == 'image':
+        # ========= 图片处理模式 ==========
+        if not args.infrared or not args.visible:
+            raise ValueError("图片模式需要指定 --visible 和 --infrared 参数")
+        
+        # 读取图像
+        img_visible = cv2.imread(args.visible)
+        img_infrared = cv2.imread(args.infrared)
+        
+        if img_visible is None or img_infrared is None:
+            print("Error: 图片加载失败，请检查路径！")
+            exit()
+        
+        # 转换为灰度图（红外图像处理）
+        img_inf_gray = cv2.cvtColor(img_infrared, cv2.COLOR_BGR2GRAY)
+        
+        # 执行融合与检测
+        flag, fusion_result, dot, en, sf, mi, ssim_val = main(img_visible, img_inf_gray)
+        
+        if flag == 1:
+            # 展示评价指标
+            print("\n======== 融合质量评价 ========")
+            print(f"信息熵（EN）: {en:.2f}")
+            print(f"空间频率（SF）: {sf:.2f}")
+            print(f"互信息（MI）: {mi:.2f}")
+            
+            # 条件显示SSIM
+            if ssim_val >= 0:
+                print(f"结构相似性（SSIM）: {ssim_val:.4f}")
+            else:
+                print("结构相似性（SSIM）: 计算失败（已跳过）")
+            
+            print(f"配准点数: {dot}")
+            # 显示并保存结果
+            # cv2.imshow("Fusion with Detection", fusion_result)
+            cv2.imwrite("output/fusion_result.jpg", fusion_result)
+            # cv2.waitKey(0)
+            # cv2.destroyAllWindows()
+        else:
+            print("融合失败！")
--- a/image_fusion/Img_Registration.py
+++ b/image_fusion/Img_Registration.py
@@ -0,0 +1,147 @@
+# -*- coding: utf-8 -*-
+# @Time :
+# @Author :
+import cv2
+import numpy as np
+
+# Module-level SIFT detector, created once and used by compuerSift2GetPts.
+sift = cv2.SIFT_create()
+
+
+def compuerSift2GetPts(img1, img2):
+    # sift 查找关键点，关键点 And 描述
+    kp1, des1 = sift.detectAndCompute(img1, None)
+    kp2, des2 = sift.detectAndCompute(img2, None)
+    
+    matcher = cv2.BFMatcher()
+    raw_matches = matcher.knnMatch(des1, des2, k=2)
+    good_matches = []
+    ratio = 0.75
+    for m1, m2 in raw_matches:
+        # 如果最接近和次接近的比值大于一个既定的值，那么我们保留这个最接近的值，认为它和其匹配的点为good_match
+        if m1.distance < ratio * m2.distance:
+            good_matches.append([m1])
+    matches = cv2.drawMatchesKnn(img1, kp1, img2, kp2, good_matches, None, flags=2)
+    ptsA = np.float32([kp1[m[0].queryIdx].pt for m in good_matches]).reshape(-1, 1, 2)
+    ptsB = np.float32([kp2[m[0].trainIdx].pt for m in good_matches]).reshape(-1, 1, 2)
+    
+    ransacReprojThreshold = 4
+    #  单应性矩阵可以将一张图通过旋转、变换等方式与另一张图对齐
+    # print(len(ptsA), len(ptsB))
+    if len(ptsA) == 0: return ptsA, ptsB, 0
+    H, status = cv2.findHomography(ptsA, ptsB, cv2.RANSAC, ransacReprojThreshold)
+    cv2.imshow("matcher", matches)
+    cv2.waitKey(100)
+    
+    return ptsA, ptsB, 1
+
+
+def findBestDistanceAndPts(ptsA, ptsB):
+    x_dct = {}
+    y_dct = {}
+    best_x, best_y = int(ptsA[0][0][0] - ptsB[0][0][0]), int(ptsA[0][0][1] - ptsB[0][0][1])
+    x_cnt, y_cnt = 0, 0
+    for i in range(len(ptsA)):
+        # print(ptsA[i], '        ', ptsB[i])
+        x_dis = int(ptsA[i][0][0] - ptsB[i][0][0])
+        y_dis = int(ptsA[i][0][1] - ptsB[i][0][1])
+        # print(x_dis)
+        if x_dis in x_dct:
+            x_dct.update({x_dis: int(x_dct.get(x_dis) + 1)})
+            if x_dct.get(x_dis) > x_cnt:
+                best_x = x_dis
+                x_cnt = x_dct.get(x_dis)
+            # print(x_dct.get(x_dis))
+        else:
+            x_dct.update({x_dis: 1})
+            # print(x_dct.get(x_dis))
+        # print(y_dis)
+        if y_dis in y_dct:
+            y_dct.update({y_dis: int(y_dct.get(y_dis) + 1)})
+            if y_dct.get(y_dis) > y_cnt:
+                best_y = y_dis
+                y_cnt = y_dct.get(y_dis)
+            # print(y_dct.get(y_dis))
+        else:
+            y_dct.update({y_dis: 1})
+            # print(y_dct.get(y_dis))
+    print(best_x, best_y)
+    
+    pt = []
+    ptb = []
+    for i in range(len(ptsA)):
+        x_dis = int(ptsA[i][0][0] - ptsB[i][0][0])
+        y_dis = int(ptsA[i][0][1] - ptsB[i][0][1])
+        if abs(best_x - x_dis) <= 0:
+            pt.append([ptsA[i][0][0], ptsA[i][0][1]])
+    # print(pt)
+    return pt, best_x, best_y
+
+
+def minDistanceHasXy(ptsA, ptsB):
+    dct = {}
+    cnt = 0
+    best = 's'
+    for i in range(len(ptsA)):
+        disx = int(ptsA[i][0][0] - ptsB[i][0][0] + 0.5)
+        disy = int(ptsA[i][0][1] - ptsB[i][0][1] + 0.5)
+        s = str(disx) + ',' + str(disy)
+        # print(s)
+        if s in dct:
+            dct.updata({s: int(dct.get(s) + 1)})
+            if dct.get(s) >= cnt:
+                cnt = dct.get(s)
+                best = s
+                print(s)
+        else:
+            dct.update({s: int(1)})
+    for i, j in dct.items():
+        print(i, j)
+    print(best)
+
+
+def detectImg(img1, img2, pta, best_x, best_y):
+    # print(pta)
+    min_x = int(min(x[0] for x in pta))
+    max_x = int(max(x[0] for x in pta))
+    min_y = int(min(x[1] for x in pta))
+    max_y = int(max(x[1] for x in pta))
+    # print(min_x, max_x)
+    # print(min_x - best_x, max_x - best_x)
+    # print(min_y, max_y)
+    # print(min_y - best_y, max_y - best_y)
+    newimg1 = img1[min_y: max_y, min_x: max_x]
+    newimg2 = img2[min_y - best_y: max_y - best_y, min_x - best_x: max_x - best_x]
+    # cv2.imshow("newimg1", newimg1)
+    # cv2.imshow("newimg2", newimg2)
+    # cv2.waitKey(0)
+    return newimg1, newimg2
+
+
+if __name__ == '__main__':
+    j = 0
+    for i in range(20, 4771, 1):
+        print(i)
+        path1 = './data/907dat/gray/camera1-' + str(i) + '.png'
+        path2 = './data/907dat/color/camera0-' + str(i) + '.png'
+        img1 = cv2.imread(path1)
+        img2 = cv2.imread(path2)
+        if (img1 is None or img2 is None): continue
+        PtsA, PtsB, f = compuerSift2GetPts(img1, img2)
+        if (f == 0): continue
+        pt, best_x, best_y = findBestDistanceAndPts(PtsA, PtsB)
+        newimg1, newimg2 = detectImg(img1, img2, pt, best_x, best_y)
+        if newimg1.shape[0] < 10 or newimg1.shape[1] < 10: continue
+        print(newimg1.shape, newimg2.shape)
+        # newimg1 = cv2.resize(newimg1, (320, 240))
+        # newimg2 = cv2.resize(newimg2, (320, 240))
+        wirtePath1 = './result/dat_result_2/gray/camera1-' + str(j) + '.png'
+        wirtePath2 = './result/dat_result_2/color/camera0-' + str(j) + '.png'
+        if newimg1.shape[0] > 255 and newimg1.shape[1] > 255 and newimg1.shape == newimg2.shape:
+            # cv2.imwrite(wirtePath1, newimg1)
+            # cv2.imwrite(wirtePath2, newimg2)
+            j += 1
+            cv2.imshow("newimg1", newimg1)
+            cv2.imshow("newimg2", newimg2)
+            cv2.waitKey()
+    print(j)
+    pass
--- a/image_fusion/init.py
+++ b/image_fusion/init.py
--- a/image_fusion/output/fusion_result.jpg
+++ b/image_fusion/output/fusion_result.jpg
--- a/image_fusion/test/infrared.jpg
+++ b/image_fusion/test/infrared.jpg
--- a/image_fusion/test/visible.jpg
+++ b/image_fusion/test/visible.jpg
--- a/requirements.txt
+++ b/requirements.txt
@@ -0,0 +1,41 @@
+certifi==2025.1.31
+charset-normalizer==3.4.1
+colorama==0.4.6
+contourpy==1.3.2
+cycler==0.12.1
+filelock==3.18.0
+fonttools==4.57.0
+fsspec==2025.3.2
+idna==3.10
+Jinja2==3.1.6
+kiwisolver==1.4.8
+MarkupSafe==3.0.2
+matplotlib==3.10.1
+mpmath==1.3.0
+networkx==3.4.2
+numpy==2.1.1
+opencv-python==4.11.0.86
+packaging==24.2
+pandas==2.2.3
+pillow==11.2.1
+psutil==7.0.0
+py-cpuinfo==9.0.0
+pyparsing==3.2.3
+python-dateutil==2.9.0.post0
+pytz==2025.2
+PyYAML==6.0.2
+requests==2.32.3
+scipy==1.15.2
+seaborn==0.13.2
+setuptools==78.1.0
+six==1.17.0
+sympy==1.13.1
+torch==2.6.0+cu124
+torchaudio==2.6.0+cu124
+torchvision==0.21.0+cu124
+tqdm==4.67.1
+typing_extensions==4.13.2
+tzdata==2025.2
+ultralytics==8.3.111
+ultralytics-thop==2.0.14
+urllib3==2.4.0
--- a/yolov8/yolov8.yaml
+++ b/yolov8/yolov8.yaml
@@ -0,0 +1,6 @@
+train: /mnt/DATA/dataset/uav_dataset/train/images/
+val:   /mnt/DATA/dataset/uav_dataset/val/images/
+test:  /mnt/DATA/dataset/test2/images/
+# number of classes
+nc:    1
+names: ['uav']
--- a/yolov8/yolov8_train.py
+++ b/yolov8/yolov8_train.py
@@ -0,0 +1,13 @@
+from ultralytics import YOLO
+
+# Load the pretrained model
+model = YOLO('../yolov8n.pt')
+
+# Start training
+model.train(
+    data='./yolov8.yaml',  # path to the dataset configuration file
+    epochs=320,                 # number of training epochs
+    batch=-1,                  # batch size; -1 asks Ultralytics to choose it automatically (AutoBatch)
+    imgsz=640,                 # input image size
+    device=0                   # device to use (0 means GPU, 'cpu' means CPU)
+)
Author	SHA1	Message	Date
Yunhao Meng	2e7cf69512	增加说明	2025-05-10 17:23:06 +08:00
Yunhao Meng	76240a12e6	增加联邦学习评价指标。bugfix: 修复训练模型参数聚合问题	2025-05-10 17:22:56 +08:00
Yunhao Meng	98321aa7d5	训练模型配置	2025-05-10 16:19:00 +08:00
Yunhao Meng	d39aa31651	删除无用文件	2025-05-10 16:18:37 +08:00
Yunhao Meng	f127ae2852	增加联邦学习指标；fix：Pytorch 加载模型不匹配	2025-05-07 10:41:36 +08:00
Yunhao Meng	3a65d89315	ignore .vscode	2025-05-07 10:41:06 +08:00
Yunhao Meng	2a3e5b17e7	yolov8对比训练	2025-05-05 17:30:12 +08:00
Yunhao Meng	c57c8f3552	忽略训练结果和pt文件	2025-05-05 17:29:58 +08:00
Yunhao Meng	310131d876	文件结构调整	2025-05-05 17:03:41 +08:00
myh	ba4508507b	评价指标优化	2025-04-22 21:41:58 +08:00
myh	89d8f4c0df	添加评价指标	2025-04-22 16:35:29 +08:00
myh	d1ed958db5	删除实例模块	2025-04-22 16:35:19 +08:00
myh	abd033b831	训练命令	2025-04-22 16:35:10 +08:00
myh	69482e6a3f	修改参数，符合Linux路径要求	2025-04-22 14:56:45 +08:00
myh	9f827af58e	删除无用样例	2025-04-22 14:51:15 +08:00
myh	338a5e07e8	修改参数，使其符合训练数据集	2025-04-22 00:19:43 +08:00
myh	9d99b00e55	更改最小测试示例	2025-04-21 23:50:41 +08:00
myh	dd0e0d869c	忽略缓存文件	2025-04-21 23:50:12 +08:00
myh	8cd6df4527	数据集测试样例配置	2025-04-21 22:27:19 +08:00
myh	132ed64136	数据集测试样例	2025-04-21 22:26:52 +08:00
myh	be1e3627e7	评价指标测试	2025-04-21 17:51:38 +08:00
myh	d139f5afcf	评价指标	2025-04-21 17:51:32 +08:00
myh	428790ab91	项目重构	2025-04-20 16:36:41 +08:00
myh	65e10f3e7d	忽略模型文件	2025-04-20 15:25:05 +08:00
myh	960b66a692	python包新加__init__文件	2025-04-20 15:21:19 +08:00
myh	ef3d521e4a	测试数据集文件	2025-04-20 15:20:40 +08:00
myh	3b80f237fa	联邦平均算法：结合yolov8	2025-04-20 15:20:16 +08:00
myh	f320e79702	更改项目结构	2025-04-20 15:19:55 +08:00
myh	34a5247dd2	联邦学习示例项目：更改结构	2025-04-20 15:19:24 +08:00
myh	1930e1b96b	格式化	2025-04-19 20:31:12 +08:00
myh	5095dbe6c0	格式化代码	2025-04-19 20:09:42 +08:00
myh	554c7e6083	删除冗余算法	2025-04-19 20:09:17 +08:00
myh	0d84bba234	测试图片	2025-04-19 19:01:07 +08:00
myh	c81de41b3e	添加三种不同模式	2025-04-19 18:59:35 +08:00
myh	b8ffb902b3	忽略三方库文件夹	2025-04-19 18:59:14 +08:00
myh	da36a8fc09	添加参数控制列表	2025-04-19 18:58:44 +08:00
myh	45db741f35	删除无用文件	2025-04-19 13:08:24 +08:00
myh	5df0e15baf	静态图片测试	2025-04-19 13:08:15 +08:00
myh	5e72ac28cc	yolo模型文件	2025-04-19 13:07:47 +08:00
myh	5b61b48d50	依赖包	2025-04-19 13:07:37 +08:00
myh	160bb2e365	测试图片	2025-04-19 13:07:28 +08:00
myh	65ee0565c2	集成YOLOv8	2025-04-18 22:51:46 +08:00
myh	ca275ba74b	图像融合模块	2025-04-18 22:15:37 +08:00
myh	1cfc280f34	联邦学习模块	2025-04-18 22:15:25 +08:00
myh	f5e527e02e	排除.idea文件夹	2025-04-18 22:06:27 +08:00
				`@@ -0,0 +1 @@`
				`0 0.36328125 0.525 0.7109375 0.8083333333333333`
				`@@ -0,0 +1 @@`
				`0 0.6934895833333333 0.6527777777777778 0.008854166666666666 0.018518518518518517`
				`@@ -0,0 +1 @@`
				`0 0.5109375 0.5322916666666667 0.125 0.13958333333333334`
				`@@ -0,0 +1 @@`
				`0 0.55078125 0.296875 0.0890625 0.08958333333333333`