
Debug the newly modified line_predict and its loss

RenLiqiang 5 months ago
Parent
Commit
35d39c6ce5
3 files changed, 178 insertions and 17 deletions
  1. models/line_detect/line_detect.py  +6 -4
  2. models/line_detect/roi_heads.py  +170 -11
  3. models/line_detect/train.yaml  +2 -2

+ 6 - 4
models/line_detect/line_detect.py

@@ -173,7 +173,7 @@ class LineDetect(BaseDetectionNet):
 
         if line_predictor is None:
             keypoint_dim_reduced = 512  # == keypoint_layers[-1]
-            line_predictor = LinePredictor(keypoint_dim_reduced, num_keypoints)
+            line_predictor = LinePredictor(keypoint_dim_reduced)
 
 
         self.roi_heads.line_roi_pool = line_roi_pool
@@ -305,13 +305,13 @@ class LineHeads(nn.Sequential):
 
 
 class LinePredictor(nn.Module):
-    def __init__(self, in_channels, num_keypoints):
+    def __init__(self, in_channels, out_channels=1 ):
         super().__init__()
         input_features = in_channels
         deconv_kernel = 4
         self.kps_score_lowres = nn.ConvTranspose2d(
             input_features,
-            num_keypoints,
+            out_channels,
             deconv_kernel,
             stride=2,
             padding=deconv_kernel // 2 - 1,
@@ -319,10 +319,12 @@ class LinePredictor(nn.Module):
         nn.init.kaiming_normal_(self.kps_score_lowres.weight, mode="fan_out", nonlinearity="relu")
         nn.init.constant_(self.kps_score_lowres.bias, 0)
         self.up_scale = 2
-        self.out_channels = num_keypoints
+        self.out_channels = out_channels
 
     def forward(self, x):
+        print(f'before kps_score_lowres x:{x.shape}')
         x = self.kps_score_lowres(x)
+        print(f'kps_score_lowres x:{x.shape}')
         return torch.nn.functional.interpolate(
             x, scale_factor=float(self.up_scale), mode="bilinear", align_corners=False, recompute_scale_factor=False
         )
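With LinePredictor now fixed to a single output channel, each ROI produces one line heatmap instead of K keypoint channels. A minimal shape check of the deconv-plus-upsample path, assuming the default 512-dim features from the line head and a hypothetical 14x14 ROI pooling resolution (neither value is stated in this diff):

import torch
import torch.nn as nn
import torch.nn.functional as F

# Stand-in mirroring the updated LinePredictor: a transposed conv that doubles the
# spatial size and reduces to a single channel, followed by a further 2x bilinear upsample.
deconv = nn.ConvTranspose2d(512, 1, kernel_size=4, stride=2, padding=1)

features = torch.randn(8, 512, 14, 14)   # hypothetical line_head output for 8 proposals
low_res = deconv(features)               # (8, 1, 28, 28)
logits = F.interpolate(low_res, scale_factor=2.0, mode="bilinear", align_corners=False)
print(logits.shape)                      # torch.Size([8, 1, 56, 56])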

+ 170 - 11
models/line_detect/roi_heads.py

@@ -1,5 +1,6 @@
 from typing import Dict, List, Optional, Tuple
 
+import matplotlib.pyplot as plt
 import torch
 import torch.nn.functional as F
 import torchvision
@@ -128,6 +129,138 @@ def maskrcnn_loss(mask_logits, proposals, gt_masks, gt_labels, mask_matched_idxs
     return mask_loss
 
 
+def line_points_to_heatmap(keypoints, rois, heatmap_size):
+    # type: (Tensor, Tensor, int) -> Tuple[Tensor, Tensor]
+    print(f'rois:{rois.shape}')
+    print(f'heatmap_size:{heatmap_size}')
+    offset_x = rois[:, 0]
+    offset_y = rois[:, 1]
+    scale_x = heatmap_size / (rois[:, 2] - rois[:, 0])
+    scale_y = heatmap_size / (rois[:, 3] - rois[:, 1])
+
+    offset_x = offset_x[:, None]
+    offset_y = offset_y[:, None]
+    scale_x = scale_x[:, None]
+    scale_y = scale_y[:, None]
+
+    print(f'keypoints.shape:{keypoints.shape}')
+    # batch_size, num_keypoints, _ = keypoints.shape
+
+    x = keypoints[..., 0]
+    y = keypoints[..., 1]
+
+    # gs=generate_gaussian_heatmaps(x,y,512,1.0)
+    # print(f'gs_heatmap shape:{gs.shape}')
+    #
+    # show_heatmap(gs,'target')
+
+    x_boundary_inds = x == rois[:, 2][:, None]
+    y_boundary_inds = y == rois[:, 3][:, None]
+
+    x = (x - offset_x) * scale_x
+    x = x.floor().long()
+    y = (y - offset_y) * scale_y
+    y = y.floor().long()
+
+    x[x_boundary_inds] = heatmap_size - 1
+    y[y_boundary_inds] = heatmap_size - 1
+    # print(f'heatmaps x:{x}')
+    # print(f'heatmaps y:{y}')
+
+    valid_loc = (x >= 0) & (y >= 0) & (x < heatmap_size) & (y < heatmap_size)
+    vis = keypoints[..., 2] > 0
+    valid = (valid_loc & vis).long()
+
+    gs_heatmap=generate_gaussian_heatmaps(x,y,heatmap_size,1.0)
+
+    # show_heatmap(gs_heatmap[0],'feature')
+
+    print(f'gs_heatmap:{gs_heatmap.shape}')
+    #
+    # lin_ind = y * heatmap_size + x
+    # print(f'lin_ind:{lin_ind.shape}')
+    # heatmaps = lin_ind * valid
+
+    return gs_heatmap
+
+
+def generate_gaussian_heatmaps(xs, ys, heatmap_size, sigma=2.0, device='cuda'):
+    """
+    Generate and merge Gaussian heatmaps for a set of point pairs.
+
+    Args:
+        xs (Tensor): x coordinates of all points, shape (N, 2)
+        ys (Tensor): y coordinates of all points, shape (N, 2)
+        heatmap_size (int): heatmap size, H = W
+        sigma (float): standard deviation of the Gaussian kernel
+        device (str): device type ('cpu' or 'cuda')
+
+    Returns:
+        Tensor: merged heatmaps of shape (N, H, W)
+    """
+
+    assert xs.shape == ys.shape, "x and y must have the same shape"
+    N = xs.shape[0]
+    print(f'N:{N}')
+
+    # Create the coordinate grid
+    grid_y, grid_x = torch.meshgrid(
+        torch.arange(heatmap_size, device=device),
+        torch.arange(heatmap_size, device=device),
+        indexing='ij'
+    )
+
+    # print(f'heatmap_size:{heatmap_size}')
+    # Initialize the output heatmaps
+    combined_heatmap = torch.zeros((N,heatmap_size, heatmap_size), device=device)
+    for i in range(N):
+
+        mu_x1 = xs[i, 0].clamp(0, heatmap_size - 1).item()
+        mu_y1 = ys[i, 0].clamp(0, heatmap_size - 1).item()
+
+        # Squared distance to the first endpoint
+        dist1 = (grid_x - mu_x1) ** 2 + (grid_y - mu_y1) ** 2
+
+        # Gaussian response for the first endpoint
+        heatmap1 = torch.exp(-dist1 / (2 * sigma ** 2))
+
+        mu_x2 = xs[i, 1].clamp(0, heatmap_size - 1).item()
+        mu_y2 = ys[i, 1].clamp(0, heatmap_size - 1).item()
+
+        # Squared distance to the second endpoint
+        dist2 = (grid_x - mu_x2) ** 2 + (grid_y - mu_y2) ** 2
+
+        # Gaussian response for the second endpoint
+        heatmap2 = torch.exp(-dist2 / (2 * sigma ** 2))
+
+        heatmap=heatmap1+heatmap2
+
+        # Store the combined heatmap for this point pair
+        combined_heatmap[i]= heatmap
+
+    return combined_heatmap
+
+
+# Helper for displaying a heatmap
+def show_heatmap(heatmap, title="Heatmap"):
+    """
+    Display a heatmap with matplotlib.
+
+    Args:
+        heatmap (Tensor): heatmap tensor to display
+        title (str): plot title
+    """
+    # If the tensor is on the GPU, move it to the CPU first and convert to a numpy array
+    if heatmap.is_cuda:
+        heatmap = heatmap.cpu().numpy()
+    else:
+        heatmap = heatmap.numpy()
+
+    plt.imshow(heatmap, cmap='hot', interpolation='nearest')
+    plt.colorbar()
+    plt.title(title)
+    plt.show()
+
 def keypoints_to_heatmap(keypoints, rois, heatmap_size):
     # type: (Tensor, Tensor, int) -> Tuple[Tensor, Tensor]
     offset_x = rois[:, 0]
@@ -158,6 +291,7 @@ def keypoints_to_heatmap(keypoints, rois, heatmap_size):
     vis = keypoints[..., 2] > 0
     valid = (valid_loc & vis).long()
 
+
     lin_ind = y * heatmap_size + x
     heatmaps = lin_ind * valid
 
@@ -298,31 +432,50 @@ def heatmaps_to_keypoints(maps, rois):
 def lines_point_pair_loss(line_logits, proposals, gt_lines, line_matched_idxs):
     # type: (Tensor, List[Tensor], List[Tensor], List[Tensor]) -> Tensor
     N, K, H, W = line_logits.shape
+    batch_size=len(proposals)
+    print(f'lines_point_pair_loss line_logits.shape:{line_logits.shape}')
     if H != W:
         raise ValueError(
             f"line_logits height and width (last two elements of shape) should be equal. Instead got H = {H} and W = {W}"
         )
     discretization_size = H
     heatmaps = []
+    gs_heatmaps=[]
     valid = []
     for proposals_per_image, gt_kp_in_image, midx in zip(proposals, gt_lines, line_matched_idxs):
+        print(f'proposals_per_image:{proposals_per_image.shape}')
         kp = gt_kp_in_image[midx]
-        heatmaps_per_image, valid_per_image = keypoints_to_heatmap(kp, proposals_per_image, discretization_size)
-        heatmaps.append(heatmaps_per_image.view(-1))
-        valid.append(valid_per_image.view(-1))
+        gs_heatmaps_per_img = line_points_to_heatmap(kp, proposals_per_image, discretization_size)
+        gs_heatmaps.append(gs_heatmaps_per_img)
+        # print(f'heatmaps_per_image:{heatmaps_per_image.shape}')
 
-    line_targets = torch.cat(heatmaps, dim=0)
-    valid = torch.cat(valid, dim=0).to(dtype=torch.uint8)
-    valid = torch.where(valid)[0]
+
+        # heatmaps.append(heatmaps_per_image.view(-1))
+
+        # valid.append(valid_per_image.view(-1))
+
+    # line_targets = torch.cat(heatmaps, dim=0)
+    gs_heatmaps=torch.cat(gs_heatmaps,dim=0)
+    print(f'gs_heatmaps:{gs_heatmaps.shape}, line_logits.shape:{line_logits.squeeze(1).shape}')
+    # print(f'line_targets:{line_targets.shape},{line_targets}')
+
+    # valid = torch.cat(valid, dim=0).to(dtype=torch.uint8)
+    # valid = torch.where(valid)[0]
+
+    # print(f' line_targets[valid]:{line_targets[valid]}')
 
     # torch.mean (in binary_cross_entropy_with_logits) doesn't
     # accept empty tensors, so handle it separately
-    if line_targets.numel() == 0 or len(valid) == 0:
-        return line_logits.sum() * 0
+    # if line_targets.numel() == 0 or len(valid) == 0:
+    #     return line_logits.sum() * 0
 
-    line_logits = line_logits.view(N * K, H * W)
+    # line_logits = line_logits.view(N * K, H * W)
+    # print(f'line_logits[valid]:{line_logits[valid].shape}')
+    line_logits=line_logits.squeeze(1)
+
+    # line_loss = F.cross_entropy(line_logits[valid], line_targets[valid])
+    line_loss=F.cross_entropy(line_logits,gs_heatmaps)
 
-    line_loss = F.cross_entropy(line_logits[valid], line_targets[valid])
     return line_loss
 
 def line_inference(x, boxes):
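The hunk above replaces the integer keypoint-index targets with dense Gaussian endpoint heatmaps. A self-contained sketch of that target construction, vectorized over ROIs and endpoints rather than looping per ROI as generate_gaussian_heatmaps does, followed by a pixel-wise binary cross-entropy shown purely for illustration (the committed code instead calls F.cross_entropy on the squeezed logits); the 56x56 size and the random endpoints are assumptions:

import torch
import torch.nn.functional as F

def gaussian_endpoint_targets(endpoints, size, sigma=1.0):
    # endpoints: (N, 2, 2) tensor of (x, y) pairs already mapped into heatmap coordinates.
    ys, xs = torch.meshgrid(
        torch.arange(size, dtype=torch.float32),
        torch.arange(size, dtype=torch.float32),
        indexing="ij",
    )
    # Broadcast to (N, 2, size, size): squared distance of every pixel to each endpoint.
    dx = xs[None, None] - endpoints[:, :, 0, None, None]
    dy = ys[None, None] - endpoints[:, :, 1, None, None]
    peaks = torch.exp(-(dx ** 2 + dy ** 2) / (2 * sigma ** 2))
    # One heatmap per ROI with two Gaussian peaks (one per line endpoint).
    return peaks.sum(dim=1)

# Dummy data: 4 ROIs, each with two endpoints inside a 56x56 heatmap.
endpoints = torch.randint(0, 56, (4, 2, 2)).float()
targets = gaussian_endpoint_targets(endpoints, 56, sigma=1.0)

logits = torch.randn(4, 1, 56, 56)        # stand-in for the LinePredictor output
# Pixel-wise comparison against the soft targets; clamp because overlapping peaks can exceed 1.
loss = F.binary_cross_entropy_with_logits(logits.squeeze(1), targets.clamp(max=1.0))
print(loss.item())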
@@ -353,6 +506,7 @@ def keypointrcnn_loss(keypoint_logits, proposals, gt_keypoints, keypoint_matched
     for proposals_per_image, gt_kp_in_image, midx in zip(proposals, gt_keypoints, keypoint_matched_idxs):
         kp = gt_kp_in_image[midx]
         heatmaps_per_image, valid_per_image = keypoints_to_heatmap(kp, proposals_per_image, discretization_size)
+
         heatmaps.append(heatmaps_per_image.view(-1))
         valid.append(valid_per_image.view(-1))
 
@@ -860,7 +1014,7 @@ class RoIHeads(nn.Module):
         if self.has_line():
             print(f'roi_heads forward has_line()!!!!')
             line_proposals = [p["boxes"] for p in result]
-            print(f'line_proposals:{len(line_proposals)}')
+            print(f'boxes_proposals:{len(line_proposals)}')
 
             # if line_proposals is None or len(line_proposals) == 0:
             #     # 返回空特征或者跳过该部分计算
@@ -892,10 +1046,15 @@ class RoIHeads(nn.Module):
                 else:
                     pos_matched_idxs = None
 
+            print(f'line_proposals:{len(line_proposals)}')
             line_features = self.line_roi_pool(features, line_proposals, image_shapes)
+            print(f'line_features from line_roi_pool:{line_features.shape}')
             line_features = self.line_head(line_features)
+            print(f'line_features from line_head:{line_features.shape}')
             line_logits = self.line_predictor(line_features)
 
+            print(f'line_logits:{line_logits.shape}')
+
             loss_line = {}
             if self.training:
                 if targets is None or pos_matched_idxs is None:

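Since this commit is about debugging the line branch, one convenient use of the show_heatmap helper added above is to compare a Gaussian target with the corresponding predicted heatmap for the same proposal. A small sketch with dummy tensors; in an actual debugging session the target would come from line_points_to_heatmap and the prediction from the line_predictor output (the names and sizes here are illustrative):

import matplotlib.pyplot as plt
import torch

target = torch.rand(56, 56)   # stand-in for gs_heatmap[i]
pred = torch.rand(56, 56)     # stand-in for line_logits[i, 0].sigmoid()

# Show target and prediction side by side with the same colormap as show_heatmap.
fig, axes = plt.subplots(1, 2, figsize=(8, 4))
for ax, hm, title in zip(axes, (target, pred), ("target", "prediction")):
    im = ax.imshow(hm.detach().cpu().numpy(), cmap="hot", interpolation="nearest")
    ax.set_title(title)
    fig.colorbar(im, ax=ax)
plt.show()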
+ 2 - 2
models/line_detect/train.yaml

@@ -1,6 +1,6 @@
 io:
   logdir: train_results
-  datadir: G:\python_ws_g\data\250612
+  datadir: \\192.168.50.222/share/rlq/datasets/250612
 #  datadir: D:\python\PycharmProjects\data_20250223\0423_
 #  datadir: I:\datasets\wirenet_1000
 
@@ -10,7 +10,7 @@ io:
 train_params:
   resume_from:
   num_workers: 8
-  batch_size: 2
+  batch_size: 4
   max_epoch: 80000
   optim:
     name: Adam