4 hónapja · ce4aa432ca
--- a/models/line_detect/heads/arc/__init__.py
+++ b/models/line_detect/heads/arc/__init__.py
--- a/models/line_detect/heads/circle/__init__.py
+++ b/models/line_detect/heads/circle/__init__.py
--- a/models/line_detect/heads/head_losses.py
+++ b/models/line_detect/heads/head_losses.py
@@ -3,6 +3,7 @@ from matplotlib import pyplot as plt
 
				 
			
 
				 import torch.nn.functional as F
			
 
				 from torch import nn
			
 
				+from torch.cuda import device
			
 
				 
			
 
				 
			
 
				 class DiceLoss(nn.Module):
			
@@ -438,12 +439,211 @@ def heatmaps_to_points(maps, rois,num_points=2):
 
				 
			
 
				     return point_preds,point_end_scores
			
 
				 
			
 
				+# 分4块
			
 
				+def find_max_heat_point_in_each_part(feature_map, box):
			
 
				+    """
			
 
				+    在给定的特征图上，根据box中心点往上移3，往右移3作为新的中心点，
			
 
				+    并将特征图划分为4个部分，之后在每个部分中找到热度值最大的点。
			
 
				+
			
 
				+    Args:
			
 
				+        feature_map (torch.Tensor): 形状为 [C, H, W] 的特征图
			
 
				+        box (torch.Tensor): 形状为 [4] 的边界框 [x_min, y_min, x_max, y_max]
			
 
				+
			
 
				+    Returns:
			
 
				+        list: 每个区域中热度最高的点的位置和其对应的热度值 [(y1, x1, heat1), ..., (y4, x4, heat4)]
			
 
				+    """
			
 
				+    device = feature_map.device
			
 
				+    C, H, W = feature_map.shape
			
 
				+
			
 
				+    # 计算box的中心点(cx, cy)
			
 
				+    cx = (box[0] + box[2]) // 2
			
 
				+    cy = (box[1] + box[3]) // 2
			
 
				+
			
 
				+    # 偏移中心点
			
 
				+    new_cx = min(max(cx + 3, 0), W - 1)  # 向右移3
			
 
				+    new_cy = min(max(cy - 3, 0), H - 1)  # 向上移3
			
 
				+
			
 
				+    # 创建坐标网格
			
 
				+    y_coords, x_coords = torch.meshgrid(
			
 
				+        torch.arange(H, device=device), torch.arange(W, device=device), indexing='ij'
			
 
				+    )
			
 
				+
			
 
				+    # 划分四个区域
			
 
				+    mask_q1 = (y_coords < new_cy) & (x_coords < new_cx)  # 左上
			
 
				+    mask_q2 = (y_coords < new_cy) & (x_coords >= new_cx)  # 右上
			
 
				+    mask_q3 = (y_coords >= new_cy) & (x_coords < new_cx)  # 左下
			
 
				+    mask_q4 = (y_coords >= new_cy) & (x_coords >= new_cx)  # 右下
			
 
				+
			
 
				+    # def process_region(mask):
			
 
				+    #     region = feature_map[:, :, mask].squeeze()
			
 
				+    #     if len(region.shape) == 0:  # 如果区域为空，则跳过
			
 
				+    #         return None, None
			
 
				+    #     # 找到最大热度值的点及其位置
			
 
				+    #     (y, x), heat_val = non_maximum_suppression(region[0])
			
 
				+    #     # 将相对坐标转换回全局坐标
			
 
				+    #     y_global = y + torch.where(mask)[0].min().item()
			
 
				+    #     x_global = x + torch.where(mask)[1].min().item()
			
 
				+    #     return (y_global, x_global), heat_val
			
 
				+    #
			
 
				+    # results = []
			
 
				+    # for mask in [mask_q1, mask_q2, mask_q3, mask_q4]:
			
 
				+    #     point, heat_val = process_region(mask)
			
 
				+    #     if point is not None:
			
 
				+    #         # results.append((point[0], point[1], heat_val))
			
 
				+    #         results.append((point[0], point[1]))
			
 
				+    #     else:
			
 
				+    #         results.append(None)
			
 
				+    masks = [mask_q1, mask_q2, mask_q3, mask_q4]
			
 
				+    results = []
			
 
				+
			
 
				+    # 假设使用第一个通道作为热力图
			
 
				+    heatmap = feature_map[0]  # [H, W]
			
 
				+
			
 
				+    def process_region(mask):
			
 
				+        # 应用 mask，只保留该区域
			
 
				+        masked_heatmap = heatmap.clone()  # 复制以避免修改原数据
			
 
				+        masked_heatmap[~mask] = 0  # 非区域置0
			
 
				+
			
 
				+        def non_maximum_suppression_2d(heatmap, kernel_size=3):
			
 
				+            """
			
 
				+            对 2D 热力图做非极大值抑制，保留局部最大值点。
			
 
				+
			
 
				+            Args:
			
 
				+                heatmap (torch.Tensor): [H, W]，输入热力图
			
 
				+                kernel_size (int): 池化窗口大小，用于比较是否为局部最大值
			
 
				+
			
 
				+            Returns:
			
 
				+                torch.Tensor: 与 heatmap 同形状的 mask，局部最大值位置为 True
			
 
				+            """
			
 
				+            pad = (kernel_size - 1) // 2
			
 
				+            max_pool = torch.nn.MaxPool2d(kernel_size=kernel_size, stride=1, padding=pad)
			
 
				+            maxima = max_pool(heatmap.unsqueeze(0)).squeeze(0)
			
 
				+            # 局部最大值且值大于0
			
 
				+            peaks = (heatmap == maxima) & (heatmap > 0)
			
 
				+            return peaks
			
 
				+
			
 
				+        # 1. 先做 NMS 得到候选局部极大值点
			
 
				+        nms_mask = non_maximum_suppression_2d(masked_heatmap, kernel_size=3)  # [H, W] bool
			
 
				+        candidate_peaks = masked_heatmap * nms_mask.float()  # 只保留 NMS 后的峰值
			
 
				+
			
 
				+        # 2. 找出所有候选点中值最大的一个
			
 
				+        if candidate_peaks.max() <= 0:
			
 
				+            return None
			
 
				+
			
 
				+        # 找到最大值的位置
			
 
				+        max_val, max_idx = torch.max(candidate_peaks.view(-1), dim=0)
			
 
				+        y, x = divmod(max_idx.item(), W)
			
 
				+
			
 
				+        return (x, y)  # 返回 (y, x)
			
 
				+
			
 
				+    for mask in masks:
			
 
				+        point = process_region(mask)
			
 
				+        results.append(point)
			
 
				+
			
 
				+    return results
			
 
				+
			
 
				+
			
 
				+def non_maximum_suppression_2d(heatmap, kernel_size=3):
			
 
				+    pad = (kernel_size - 1) // 2
			
 
				+    max_pool = torch.nn.MaxPool2d(kernel_size=kernel_size, stride=1, padding=pad)
			
 
				+    maxima = max_pool(heatmap.unsqueeze(0)).squeeze(0)
			
 
				+    peaks = (heatmap == maxima) & (heatmap > 0)
			
 
				+    return peaks
			
 
				+
			
 
				+def find_max_heat_point_in_edge_centers(feature_map, box):
			
 
				+
			
 
				+    device = feature_map.device
			
 
				+    C, H, W = feature_map.shape
			
 
				+
			
 
				+    # ¼ÆËã box ÖÐÐÄ
			
 
				+    cx = (box[0] + box[2]) / 2
			
 
				+    cy = (box[1] + box[3]) / 2
			
 
				+
			
 
				+    # ¸ù¾Ý box ¿í¸ß¼ÆËã¾Å¹¬¸ñ·Ö½çÏß
			
 
				+    box_width = box[2] - box[0]
			
 
				+    box_height = box[3] - box[1]
			
 
				+
			
 
				+    x_left = cx - box_width / 6
			
 
				+    x_right = cx + box_width / 6
			
 
				+    y_top = cy - box_height / 6
			
 
				+    y_bottom = cy + box_height / 6
			
 
				+
			
 
				+    # ´´½¨Íø¸ñ
			
 
				+    y_coords, x_coords = torch.meshgrid(
			
 
				+        torch.arange(H, device=device),
			
 
				+        torch.arange(W, device=device),
			
 
				+        indexing='ij'
			
 
				+    )
			
 
				+
			
 
				+    # ¶¨ÒåËÄ¸ö¡°±ßÖÐ¡±ÇøÓòµÄ mask
			
 
				+    mask1 = (x_coords < x_left) & (y_coords < y_top)
			
 
				+    mask_top_middle    = (x_coords >= x_left) & (x_coords < x_right) & (y_coords < y_top)
			
 
				+    mask3 = (x_coords >= x_right) & (y_coords < y_top)
			
 
				+
			
 
				+    mask_left_middle = (x_coords < x_left) & (y_coords >= y_top) & (y_coords < y_bottom)
			
 
				+    mask_right_middle  = (x_coords >= x_right) & (y_coords >= y_top) & (y_coords < y_bottom)
			
 
				+
			
 
				+    mask4 = (x_coords < x_left) & (y_coords >= y_bottom)
			
 
				+    mask_bottom_middle = (x_coords >= x_left) & (x_coords < x_right) & (y_coords >= y_bottom)
			
 
				+    mask_right_bottom = (x_coords >= x_right) & (y_coords >= y_bottom)
			
 
				+
			
 
				+    # masks = [
			
 
				+    #     # mask1,
			
 
				+    #     mask_top_middle,
			
 
				+    #     # mask3,
			
 
				+    #     mask_left_middle,
			
 
				+    #     mask_right_middle,
			
 
				+    #     # mask4,
			
 
				+    #     mask_bottom_middle,
			
 
				+    #     mask_right_bottom
			
 
				+    # ]
			
 
				+
			
 
				+    masks = [
			
 
				+        mask_top_middle,
			
 
				+        mask_right_middle,
			
 
				+        mask_bottom_middle,
			
 
				+        mask_left_middle
			
 
				+    ]
			
 
				+
			
 
				+    # Ê¹ÓÃµÚÒ»¸öÍ¨µÀ×÷ÎªÈÈÁ¦Í¼
			
 
				+    heatmap = feature_map[0]  # [H, W]
			
 
				+
			
 
				+    results = []
			
 
				+
			
 
				+    for mask in masks:
			
 
				+        masked_heatmap = heatmap.clone()
			
 
				+        masked_heatmap[~mask] = 0  # ·ÇÄ¿±êÇøÓòÖÃ 0
			
 
				+
			
 
				+        # # NMS ÒÖÖÆ
			
 
				+        # nms_mask = non_maximum_suppression_2d(masked_heatmap, kernel_size=3)
			
 
				+        # candidate_peaks = masked_heatmap * nms_mask.float()
			
 
				+        #
			
 
				+        # if candidate_peaks.max() <= 0:
			
 
				+        #     results.append(None)
			
 
				+        #     continue
			
 
				+        #
			
 
				+        # # ÕÒ×î´óÖµÎ»ÖÃ
			
 
				+        # max_val, max_idx = torch.max(candidate_peaks.view(-1), dim=0)
			
 
				+        # y, x = divmod(max_idx.item(), W)
			
 
				+        flatten_point_roi_map = masked_heatmap.reshape(1, -1)
			
 
				+        point_score, point_index = torch.topk(flatten_point_roi_map, k=1)
			
 
				+        point_x =point_index % W
			
 
				+        point_y = torch.div(point_index - point_x, W, rounding_mode="floor")
			
 
				+
			
 
				+        results.append((point_x, point_y))
			
 
				+
			
 
				+    return results  # [(y_top, x_top), (y_right, x_right), (y_bottom, x_bottom), (y_left, x_left)]
			
 
				+
			
 
				+
			
 
				+
			
 
				 def heatmaps_to_circle_points(maps, rois,num_points=2):
			
 
				 
			
 
				 
			
 
				     point_preds = torch.zeros((len(rois), 4, 2), dtype=torch.float32, device=maps.device)
			
 
				     point_end_scores = torch.zeros((len(rois),4, 1), dtype=torch.float32, device=maps.device)
			
 
				 
			
 
				+    print(f'rois in heatmaps_to_circle_points:{type(rois),  rois.shape}')   # <class 'torch.Tensor'>
			
 
				+
			
 
				     print(f'heatmaps_to_lines:{maps.shape}')
			
 
				     point_maps=maps[:,0]
			
 
				     print(f'point_map:{point_maps.shape}')
			
@@ -452,18 +652,24 @@ def heatmaps_to_circle_points(maps, rois,num_points=2):
 
				         point_roi_map = point_maps[i].unsqueeze(0)
			
 
				         print(f'point_roi_map:{point_roi_map.shape}')
			
 
				         # roi_map_probs = scores_to_probs(roi_map.copy())
			
 
				-        w = point_roi_map.shape[2]
			
 
				-        flatten_point_roi_map = non_maximum_suppression(point_roi_map).reshape(1, -1)
			
 
				-        point_score, point_index = torch.topk(flatten_point_roi_map, k=num_points)
			
 
				-        print(f'point index:{point_index}')
			
 
				-        # pos = roi_map.reshape(num_keypoints, -1).argmax(dim=1)
			
 
				-
			
 
				-        point_x =point_index % w
			
 
				-        point_y = torch.div(point_index - point_x, w, rounding_mode="floor")
			
 
				-
			
 
				 
			
 
				-        point_preds[i, :,0] = point_x
			
 
				-        point_preds[i, :,1] = point_y
			
 
				+        # w = point_roi_map.shape[2]
			
 
				+        # flatten_point_roi_map = non_maximum_suppression(point_roi_map).reshape(1, -1)
			
 
				+        # print(f'non_maximum_suppression :{non_maximum_suppression(point_roi_map).shape}')
			
 
				+        # point_score, point_index = torch.topk(flatten_point_roi_map, k=num_points)
			
 
				+        # print(f'point index:{point_index}')
			
 
				+        # point_x =point_index % w
			
 
				+        # point_y = torch.div(point_index - point_x, w, rounding_mode="floor")
			
 
				+        # print(f'point_x:{point_x}, point_y:{point_y}')
			
 
				+        # point_preds[i, :, 0] = point_x
			
 
				+        # point_preds[i, :, 1] = point_y
			
 
				+        roi1=rois[i]
			
 
				+        result_points = find_max_heat_point_in_edge_centers(non_maximum_suppression(point_roi_map), roi1)
			
 
				+
			
 
				+        point_preds[i, :]=torch.tensor(result_points)
			
 
				+
			
 
				+        point_x = [point[0] for point in result_points]
			
 
				+        point_y = [point[1] for point in result_points]
			
 
				 
			
 
				         point_end_scores[i, :,0] = point_roi_map[torch.arange(1, device=point_roi_map.device), point_y, point_x]
			
 
				 
			
--- a/models/line_detect/heads/line/__init__.py
+++ b/models/line_detect/heads/line/__init__.py
--- a/models/line_detect/heads/point/__init__.py
+++ b/models/line_detect/heads/point/__init__.py
--- a/models/line_detect/line_detect.py
+++ b/models/line_detect/line_detect.py
@@ -351,9 +351,9 @@ def linedetect_newresnet18fpn(
 
				     # weights = LineNet_ResNet50_FPN_Weights.verify(weights)
			
 
				     # weights_backbone = ResNet50_Weights.verify(weights_backbone)
			
 
				     if num_classes is None:
			
 
				-        num_classes = 4
			
 
				+        num_classes = 5
			
 
				     if num_points is None:
			
 
				-        num_points = 3
			
 
				+        num_points = 4
			
 
				 
			
 
				     size=512
			
 
				     backbone =resnet18fpn()
			
@@ -378,7 +378,8 @@ def linedetect_newresnet18fpn(
 
				                        rpn_anchor_generator=anchor_generator, box_roi_pool=roi_pooler,
			
 
				                        detect_point=False,
			
 
				                        detect_line=False,
			
 
				-                       detect_arc=True,
			
 
				+                       detect_arc=False,
			
 
				+                       detect_circle=True,
			
 
				 
			
 
				                        **kwargs)
			
 
				 
			
--- a/models/line_detect/train.yaml
+++ b/models/line_detect/train.yaml
@@ -7,7 +7,7 @@ io:
 
				 #  datadir: /data/share/rlq/datasets/250718caisegangban
			
 
				 
			
 
				 #  datadir: /data/share/rlq/datasets/singepoint_Dataset0709_2
			
 
				-  datadir: /data/share/zyh/data/rgb_4point/a_dataset
			
 
				+  datadir: \\192.168.50.222/share/rlq/datasets/guanban_circle
			
 
				 #  datadir: \\192.168.50.222/share/rlq/datasets/singepoint_Dataset0709_2
			
 
				 #  datadir: \\192.168.50.222/share/rlq/datasets/250718caisegangban
			
 
				   data_type: rgb
			
--- a/models/line_detect/train_demo.py
+++ b/models/line_detect/train_demo.py
@@ -17,8 +17,8 @@ if __name__ == '__main__':
 
				     # model = lineDetect_resnet18_fpn()
			
 
				 
			
 
				     # model=linedetect_resnet18_fpn()
			
 
				-    # model=linedetect_newresnet18fpn(num_points=3)
			
 
				-    model=linedetect_newresnet50fpn(num_points=4)
			
 
				+    model=linedetect_newresnet18fpn(num_points=4)
			
 
				+    # model=linedetect_newresnet50fpn(num_points=4)
			
 
				     # model = linedetect_newresnet101fpn(num_points=3)
			
 
				     # model = linedetect_newresnet152fpn(num_points=3)
			
 
				     # model.load_weights(save_path=r'/home/admin/projects/MultiVisionModels/models/line_detect/train_results/20250711_114046/weights/best_val.pth')