Add line segment angle and length losses; fix the ROI mapping problem

RenLiqiang, 5 months ago
parent commit 5338e7af68
1 changed file with 201 additions and 142 deletions
models/line_detect/loi_heads.py  (+201, -142)

@@ -6,7 +6,7 @@ import torch.nn.functional as F
 import torchvision
 # from scipy.optimize import linear_sum_assignment
 from torch import nn, Tensor
-from  libs.vision_libs.ops import boxes as box_ops, roi_align
+from libs.vision_libs.ops import boxes as box_ops, roi_align
 
 import libs.vision_libs.models.detection._utils as det_utils
 
@@ -129,19 +129,77 @@ def maskrcnn_loss(mask_logits, proposals, gt_masks, gt_labels, mask_matched_idxs
     )
     return mask_loss
 
+def normalize_tensor(t):
+    return (t - t.min()) / (t.max() - t.min() + 1e-6)
+
+def line_length(lines):
+    """
+    Compute the length of each line segment.
+    lines: [N, 2, 2] tensor of N segments, each given by two endpoints
+    returns: [N]
+    """
+    return torch.norm(lines[:, 1] - lines[:, 0], dim=-1)
+
+def line_direction(lines):
+    """
+    Compute the unit direction vector of each line segment.
+    lines: [N, 2, 2]
+    returns: [N, 2] unit direction vectors
+    """
+    vec = lines[:, 1] - lines[:, 0]
+    return F.normalize(vec, dim=-1)
+
+def angle_loss_cosine(pred_dir, gt_dir):
+    """
+    Measure the direction difference via cosine similarity.
+    pred_dir: [N, 2]
+    gt_dir: [N, 2]
+    returns: [N]
+    """
+    cos_sim = torch.sum(pred_dir * gt_dir, dim=-1).clamp(-1.0, 1.0)
+    return 1.0 - cos_sim  # alternatively: torch.acos(cos_sim) / pi
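
A minimal usage sketch of the three helpers above on made-up segments (tensors and values are illustrative only):

import torch
import torch.nn.functional as F

# one horizontal and one 45-degree segment, as [N, 2, 2]
lines = torch.tensor([[[0.0, 0.0], [3.0, 0.0]],
                      [[0.0, 0.0], [3.0, 3.0]]])
lengths = torch.norm(lines[:, 1] - lines[:, 0], dim=-1)   # tensor([3.0000, 4.2426])
dirs = F.normalize(lines[:, 1] - lines[:, 0], dim=-1)     # unit direction per segment
# cosine penalty between the two directions: 1 - cos(45 deg), about 0.2929
loss = 1.0 - torch.sum(dirs[0] * dirs[1]).clamp(-1.0, 1.0)

Note that the penalty is direction-sensitive: swapping a segment's endpoints flips the sign of cos_sim, so 1 - cos_sim treats an antiparallel match as maximally wrong even when the undirected lines coincide.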
+
+
 def line_points_to_heatmap(keypoints, rois, heatmap_size):
-    # type: (Tensor, Tensor, int) -> Tuple[Tensor, Tensor]
+    # type: (Tensor, Tensor, int) -> Tensor
     print(f'rois:{rois.shape}')
     print(f'heatmap_size:{heatmap_size}')
-    offset_x = rois[:, 0]
-    offset_y = rois[:, 1]
-    scale_x = heatmap_size / (rois[:, 2] - rois[:, 0])
-    scale_y = heatmap_size / (rois[:, 3] - rois[:, 1])
-
-    offset_x = offset_x[:, None]
-    offset_y = offset_y[:, None]
-    scale_x = scale_x[:, None]
-    scale_y = scale_y[:, None]
+    # offset_x = rois[:, 0]
+    # offset_y = rois[:, 1]
+    # scale_x = heatmap_size / (rois[:, 2] - rois[:, 0])
+    # scale_y = heatmap_size / (rois[:, 3] - rois[:, 1])
+    #
+    # offset_x = offset_x[:, None]
+    # offset_y = offset_y[:, None]
+    # scale_x = scale_x[:, None]
+    # scale_y = scale_y[:, None]
 
     print(f'keypoints.shape:{keypoints.shape}')
     # batch_size, num_keypoints, _ = keypoints.shape
@@ -149,28 +207,29 @@ def line_points_to_heatmap(keypoints, rois, heatmap_size):
     x = keypoints[..., 0]
     y = keypoints[..., 1]
 
-    gs=generate_gaussian_heatmaps(x,y,heatmap_size,1.0)
+    gs = generate_gaussian_heatmaps(x, y, heatmap_size, 1.0)
     # show_heatmap(gs[0],'target')
-    all_roi_heatmap=[]
-    for roi ,heatmap in zip(rois,gs):
+    all_roi_heatmap = []
+    for roi, heatmap in zip(rois, gs):
         # print(f'heatmap:{heatmap.shape}')
-        heatmap=heatmap.unsqueeze(0)
+        heatmap = heatmap.unsqueeze(0)
         x1, y1, x2, y2 = map(int, roi)
         roi_heatmap = torch.zeros_like(heatmap)
-        roi_heatmap[..., y1:y2+1, x1:x2+1]=heatmap[..., y1:y2+1, x1:x2+1]
+        roi_heatmap[..., y1:y2 + 1, x1:x2 + 1] = heatmap[..., y1:y2 + 1, x1:x2 + 1]
         # show_heatmap(roi_heatmap,'roi_heatmap')
         all_roi_heatmap.append(roi_heatmap)
 
-    all_roi_heatmap=torch.cat(all_roi_heatmap)
+    all_roi_heatmap = torch.cat(all_roi_heatmap)
     print(f'all_roi_heatmap:{all_roi_heatmap.shape}')
 
-
     return all_roi_heatmap
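
The target construction above keeps the Gaussian heatmap in full-image coordinates and simply zeroes everything outside each ROI, instead of rescaling keypoints into ROI-local coordinates as the commented-out offset/scale code did. A minimal sketch of the masking step, with assumed sizes:

import torch

heatmap = torch.rand(1, 512, 512)     # full-resolution Gaussian target (illustrative size)
x1, y1, x2, y2 = 100, 120, 300, 260   # an ROI already in heatmap coordinates
roi_heatmap = torch.zeros_like(heatmap)
roi_heatmap[..., y1:y2 + 1, x1:x2 + 1] = heatmap[..., y1:y2 + 1, x1:x2 + 1]
# outside the box everything is zero; no offset or scale bookkeeping is needed

This only lines up with the logits because lines_features_align below keeps the features at the same full resolution rather than pooling each ROI to a fixed grid.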
 
 
 """
 Point-to-heatmap conversion adapted to the original structure; for the version that uses roi_pool.
 """
+
+
 def line_points_to_heatmap_(keypoints, rois, heatmap_size):
     # type: (Tensor, Tensor, int) -> Tuple[Tensor, Tensor]
     print(f'rois:{rois.shape}')
@@ -193,7 +252,6 @@ def line_points_to_heatmap_(keypoints, rois, heatmap_size):
 
     # gs=generate_gaussian_heatmaps(x,y,512,1.0)
 
-
     # print(f'gs_heatmap shape:{gs.shape}')
     #
     # show_heatmap(gs[0],'target')
@@ -215,9 +273,9 @@ def line_points_to_heatmap_(keypoints, rois, heatmap_size):
     vis = keypoints[..., 2] > 0
     valid = (valid_loc & vis).long()
 
-    gs_heatmap=generate_gaussian_heatmaps(x,y,heatmap_size,1.0)
+    gs_heatmap = generate_gaussian_heatmaps(x, y, heatmap_size, 1.0)
 
-    show_heatmap(gs_heatmap[0],'feature')
+    show_heatmap(gs_heatmap[0], 'feature')
 
     # print(f'gs_heatmap:{gs_heatmap.shape}')
     #
@@ -256,9 +314,8 @@ def generate_gaussian_heatmaps(xs, ys, heatmap_size, sigma=2.0, device='cuda'):
 
     # print(f'heatmap_size:{heatmap_size}')
     # initialize the output heatmaps
-    combined_heatmap = torch.zeros((N,heatmap_size, heatmap_size), device=device)
+    combined_heatmap = torch.zeros((N, heatmap_size, heatmap_size), device=device)
     for i in range(N):
-
         mu_x1 = xs[i, 0].clamp(0, heatmap_size - 1).item()
         mu_y1 = ys[i, 0].clamp(0, heatmap_size - 1).item()
 
@@ -277,10 +334,10 @@ def generate_gaussian_heatmaps(xs, ys, heatmap_size, sigma=2.0, device='cuda'):
         # evaluate the Gaussian distribution
         heatmap2 = torch.exp(-dist2 / (2 * sigma ** 2))
 
-        heatmap=heatmap1+heatmap2
+        heatmap = heatmap1 + heatmap2
 
         # write the current heatmap into the result
-        combined_heatmap[i]= heatmap
+        combined_heatmap[i] = heatmap
 
     return combined_heatmap
 
@@ -305,6 +362,7 @@ def show_heatmap(heatmap, title="Heatmap"):
     plt.title(title)
     plt.show()
 
+
 def keypoints_to_heatmap(keypoints, rois, heatmap_size):
     # type: (Tensor, Tensor, int) -> Tuple[Tensor, Tensor]
     offset_x = rois[:, 0]
@@ -335,7 +393,6 @@ def keypoints_to_heatmap(keypoints, rois, heatmap_size):
     vis = keypoints[..., 2] > 0
     valid = (valid_loc & vis).long()
 
-
     lin_ind = y * heatmap_size + x
     heatmaps = lin_ind * valid
 
@@ -343,7 +400,7 @@ def keypoints_to_heatmap(keypoints, rois, heatmap_size):
 
 
 def _onnx_heatmaps_to_keypoints(
-    maps, maps_i, roi_map_width, roi_map_height, widths_i, heights_i, offset_x_i, offset_y_i
+        maps, maps_i, roi_map_width, roi_map_height, widths_i, heights_i, offset_x_i, offset_y_i
 ):
     num_keypoints = torch.scalar_tensor(maps.size(1), dtype=torch.int64)
 
@@ -395,7 +452,7 @@ def _onnx_heatmaps_to_keypoints(
 
 @torch.jit._script_if_tracing
 def _onnx_heatmaps_to_keypoints_loop(
-    maps, rois, widths_ceil, heights_ceil, widths, heights, offset_x, offset_y, num_keypoints
+        maps, rois, widths_ceil, heights_ceil, widths, heights, offset_x, offset_y, num_keypoints
 ):
     xy_preds = torch.zeros((0, 3, int(num_keypoints)), dtype=torch.float32, device=maps.device)
     end_scores = torch.zeros((0, int(num_keypoints)), dtype=torch.float32, device=maps.device)
@@ -473,11 +530,14 @@ def heatmaps_to_keypoints(maps, rois):
         end_scores[i, :] = roi_map[torch.arange(num_keypoints, device=roi_map.device), y_int, x_int]
 
     return xy_preds.permute(0, 2, 1), end_scores
+
+
 def non_maximum_suppression(a):
     ap = F.max_pool2d(a, 3, stride=1, padding=1)
     mask = (a == ap).float().clamp(min=0.0)
     return a * mask
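
non_maximum_suppression keeps only local maxima: a value survives exactly when it equals the 3x3 max-pool of its own neighbourhood. A small sketch on an assumed 5x5 map:

import torch
import torch.nn.functional as F

a = torch.zeros(1, 1, 5, 5)
a[0, 0, 2, 2] = 1.0   # a peak
a[0, 0, 2, 3] = 0.5   # a weaker neighbour of the peak
ap = F.max_pool2d(a, 3, stride=1, padding=1)
mask = (a == ap).float().clamp(min=0.0)
out = a * mask        # the 1.0 peak survives, the 0.5 neighbour is zeroed

One caveat of this trick: on a plateau of equal maxima, every plateau cell equals the pooled maximum, so all of them survive.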
 
+
 def heatmaps_to_lines(maps, rois):
     """Extract predicted keypoint locations from heatmaps. Output has shape
     (#rois, 4, #keypoints) with the 4 rows corresponding to (x, y, logit, prob)
@@ -488,54 +548,36 @@ def heatmaps_to_lines(maps, rois):
     # consistency with keypoints_to_heatmap_labels by using the conversion from
     # Heckbert 1990: c = d + 0.5, where d is a discrete coordinate and c is a
     # continuous coordinate.
-    offset_x = rois[:, 0]
-    offset_y = rois[:, 1]
-
-    widths = rois[:, 2] - rois[:, 0]
-    heights = rois[:, 3] - rois[:, 1]
-    widths = widths.clamp(min=1)
-    heights = heights.clamp(min=1)
-    widths_ceil = widths.ceil()
-    heights_ceil = heights.ceil()
-
-    num_keypoints = maps.shape[1]
-
     xy_preds = torch.zeros((len(rois), 3, 2), dtype=torch.float32, device=maps.device)
     end_scores = torch.zeros((len(rois), 2), dtype=torch.float32, device=maps.device)
 
     for i in range(len(rois)):
-        roi_map_width = int(widths_ceil[i].item())
-        roi_map_height = int(heights_ceil[i].item())
-        width_correction = widths[i] / roi_map_width
-        height_correction = heights[i] / roi_map_height
-        roi_map = F.interpolate(
-            maps[i][:, None], size=(roi_map_height, roi_map_width), mode="bicubic", align_corners=False
-        )[:, 0]
+        roi_map = maps[i]
+
         print(f'roi_map:{roi_map.shape}')
         # roi_map_probs = scores_to_probs(roi_map.copy())
         w = roi_map.shape[2]
-        flatten_map=non_maximum_suppression(roi_map).reshape(1, -1)
+        flatten_map = non_maximum_suppression(roi_map).reshape(1, -1)
         score, index = torch.topk(flatten_map, k=2)
 
         print(f'index:{index}')
 
         # pos = roi_map.reshape(num_keypoints, -1).argmax(dim=1)
 
-        pos=index
+        pos = index
 
-        x_int = pos % w
+        # x_int = pos % w
+        #
+        # y_int = torch.div(pos - x_int, w, rounding_mode="floor")
 
-        y_int = torch.div(pos - x_int, w, rounding_mode="floor")
+        x = pos % w
 
+        y = torch.div(pos - x, w, rounding_mode="floor")
 
-        # assert (roi_map_probs[k, y_int, x_int] ==
-        #         roi_map_probs[k, :, :].max())
-        x = (x_int.float() + 0.5) * width_correction
-        y = (y_int.float() + 0.5) * height_correction
-        xy_preds[i, 0, :] = x + offset_x[i]
-        xy_preds[i, 1, :] = y + offset_y[i]
+        xy_preds[i, 0, :] = x
+        xy_preds[i, 1, :] = y
         xy_preds[i, 2, :] = 1
-        end_scores[i, :] = roi_map[torch.arange(1, device=roi_map.device), y_int, x_int]
+        end_scores[i, :] = roi_map[torch.arange(1, device=roi_map.device), y, x]
 
     return xy_preds.permute(0, 2, 1), end_scores
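
In the rewritten heatmaps_to_lines, the two strongest NMS responses of each map are taken directly as the segment endpoints; the per-ROI bicubic interpolation, the 0.5 sub-pixel shift, and the offset_x/offset_y terms are dropped because the maps are already in full-image coordinates. A sketch of the index arithmetic, assuming a square map of width w:

import torch

w = 512
flatten_map = torch.rand(1, w * w)           # NMS-ed heatmap, flattened (illustrative)
score, index = torch.topk(flatten_map, k=2)  # top-2 peaks = candidate endpoints
x = index % w                                # column of each peak
y = torch.div(index - x, w, rounding_mode="floor")  # row of each peak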
 
@@ -544,30 +586,29 @@ def lines_features_align(features, proposals, img_size):
     print(f'lines_features_align features:{features.shape}')
 
     align_feat_list = []
-    for feat, proposals_per_img  in zip(features,proposals):
+    for feat, proposals_per_img in zip(features, proposals):
         # print(f'lines_features_align feat:{feat.shape}, proposals_per_img:{proposals_per_img.shape}')
 
-        feat=feat.unsqueeze(0)
+        feat = feat.unsqueeze(0)
         for proposal in proposals_per_img:
             align_feat = torch.zeros_like(feat)
             # print(f'align_feat:{align_feat.shape}')
             x1, y1, x2, y2 = map(lambda v: int(v.item()), proposal)
             # copy the region inside each proposal box into the matching slot of align_feat
-            align_feat[:,:, y1:y2 + 1, x1:x2 + 1] = feat[:,:, y1:y2 + 1, x1:x2 + 1]
+            align_feat[:, :, y1:y2 + 1, x1:x2 + 1] = feat[:, :, y1:y2 + 1, x1:x2 + 1]
             align_feat_list.append(align_feat)
 
-
-    feats_tensor=torch.cat(align_feat_list)
+    feats_tensor = torch.cat(align_feat_list)
 
     print(f'align features :{feats_tensor.shape}')
 
-    return  feats_tensor
+    return feats_tensor
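
lines_features_align stands in for line_roi_pool: instead of resampling each box to a fixed grid, it emits one full-resolution copy of the feature map per proposal with everything outside the box zeroed. A sketch of a single iteration, with assumed shapes:

import torch

feat = torch.rand(1, 16, 512, 512)   # per-image features after channel_compress (illustrative)
proposal = torch.tensor([100., 120., 300., 260.])
x1, y1, x2, y2 = map(lambda v: int(v.item()), proposal)
align_feat = torch.zeros_like(feat)
align_feat[:, :, y1:y2 + 1, x1:x2 + 1] = feat[:, :, y1:y2 + 1, x1:x2 + 1]

This keeps predictions and heatmap targets in one shared coordinate frame, which is what the ROI-mapping fix is after, at the cost of materializing one full H x W tensor per proposal.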
 
 
 def lines_point_pair_loss(line_logits, proposals, gt_lines, line_matched_idxs):
     # type: (Tensor, List[Tensor], List[Tensor], List[Tensor]) -> Tensor
     N, K, H, W = line_logits.shape
-    len_proposals=len(proposals)
+    len_proposals = len(proposals)
     print(f'lines_point_pair_loss line_logits.shape:{line_logits.shape},len_proposals:{len_proposals}')
     if H != W:
         raise ValueError(
@@ -575,7 +616,7 @@ def lines_point_pair_loss(line_logits, proposals, gt_lines, line_matched_idxs):
         )
     discretization_size = H
     heatmaps = []
-    gs_heatmaps=[]
+    gs_heatmaps = []
     valid = []
     for proposals_per_image, gt_kp_in_image, midx in zip(proposals, gt_lines, line_matched_idxs):
         print(f'proposals_per_image:{proposals_per_image.shape}')
@@ -584,13 +625,12 @@ def lines_point_pair_loss(line_logits, proposals, gt_lines, line_matched_idxs):
         gs_heatmaps.append(gs_heatmaps_per_img)
         # print(f'heatmaps_per_image:{heatmaps_per_image.shape}')
 
-
         # heatmaps.append(heatmaps_per_image.view(-1))
 
         # valid.append(valid_per_image.view(-1))
 
     # line_targets = torch.cat(heatmaps, dim=0)
-    gs_heatmaps=torch.cat(gs_heatmaps,dim=0)
+    gs_heatmaps = torch.cat(gs_heatmaps, dim=0)
     print(f'gs_heatmaps:{gs_heatmaps.shape}, line_logits.shape:{line_logits.squeeze(1).shape}')
     # print(f'line_targets:{line_targets.shape},{line_targets}')
 
@@ -606,10 +646,10 @@ def lines_point_pair_loss(line_logits, proposals, gt_lines, line_matched_idxs):
 
     # line_logits = line_logits.view(N * K, H * W)
     # print(f'line_logits[valid]:{line_logits[valid].shape}')
-    line_logits=line_logits.squeeze(1)
+    line_logits = line_logits.squeeze(1)
 
     # line_loss = F.cross_entropy(line_logits[valid], line_targets[valid])
-    line_loss=F.cross_entropy(line_logits,gs_heatmaps)
+    line_loss = F.cross_entropy(line_logits, gs_heatmaps)
 
     return line_loss
 
@@ -647,6 +687,7 @@ def lines_to_boxes(lines, img_size=511):
     boxes = torch.stack([x_min, y_min, x_max, y_max], dim=1)  # (N, 4)
     return boxes
 
+
 def box_iou_pairwise(box1, box2):
     """
     Inputs:
@@ -669,33 +710,63 @@ def box_iou_pairwise(box1, box2):
     ious = inter_area / (union_area + 1e-6)
 
     return ious
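
box_iou_pairwise is aligned, not all-pairs: the i-th box of box1 is compared with the i-th box of box2, giving an [N] tensor rather than an N x M matrix. For example, with made-up boxes:

import torch

box1 = torch.tensor([[0.0, 0.0, 10.0, 10.0]])
box2 = torch.tensor([[5.0, 5.0, 15.0, 15.0]])
# intersection 5 * 5 = 25, union 100 + 100 - 25 = 175, IoU approx. 0.1429
ious = box_iou_pairwise(box1, box2)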
-def line_iou_loss(x, boxes, gt_lines, matched_idx, img_size=511):
+
+
+def line_iou_loss(x, boxes, gt_lines, matched_idx, img_size=511, alpha=1.0, beta=1.0, gamma=1.0):
+    """
+    Args:
+        x: [N,1,H,W] 热力图
+        boxes: [N,4] 框坐标
+        gt_lines: [N,2,3] GT线段(含可见性)
+        matched_idx: 匹配 index
+        img_size: 图像尺寸
+        alpha: IoU 损失权重
+        beta: 长度损失权重
+        gamma: 方向角度损失权重
+    """
     losses = []
     boxes_per_image = [box.size(0) for box in boxes]
     x2 = x.split(boxes_per_image, dim=0)
 
     for xx, bb, gt_line, mid in zip(x2, boxes, gt_lines, matched_idx):
-        p_prob, scores = heatmaps_to_lines(xx, bb)
+        p_prob, _ = heatmaps_to_lines(xx, bb)
         pred_lines = p_prob
         gt_line_points = gt_line[mid]
 
         if len(pred_lines) == 0 or len(gt_line_points) == 0:
             continue
 
+        # IoU loss
         pred_boxes = lines_to_boxes(pred_lines, img_size)
         gt_boxes = lines_to_boxes(gt_line_points, img_size)
-
         ious = box_iou_pairwise(pred_boxes, gt_boxes)
+        iou_loss = 1.0 - ious  # [N]
+
+        # length loss
+        pred_len = line_length(pred_lines)
+        gt_len = line_length(gt_line_points)
+        length_diff = F.l1_loss(pred_len, gt_len, reduction='none')  # [N]
+
+        # direction/angle loss
+        pred_dir = line_direction(pred_lines)
+        gt_dir = line_direction(gt_line_points)
+        ang_loss = angle_loss_cosine(pred_dir, gt_dir)  # [N]
 
-        loss = 1.0 - ious
-        losses.append(loss)
+        # normalize each loss term
+        norm_iou = normalize_tensor(iou_loss)
+        norm_len = normalize_tensor(length_diff)
+        norm_ang = normalize_tensor(ang_loss)
 
-    if not losses:  # if the loss list is empty, return a default value or raise a custom exception
-        print("Warning: No valid losses were computed.")
-        return torch.tensor(1.0, requires_grad=True).to(x.device)  # return a scalar tensor
+        total = alpha * norm_iou + beta * norm_len + gamma * norm_ang
+        losses.append(total)
+
+    if not losses:
+        return None
+
+    return torch.mean(torch.cat(losses))
 
-    total_loss = torch.mean(torch.cat(losses))
-    return total_loss
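
line_iou_loss now returns None when no proposal/GT pair survives, instead of the old dummy 1.0 loss, so the caller is expected to guard that case. A hypothetical caller sketch (the forward pass below currently assigns the value without a check):

iou_loss = line_iou_loss(line_logits, line_proposals, gt_lines, pos_matched_idxs, img_size)
loss_line_iou = {} if iou_loss is None else {'loss_line_iou': iou_loss}

One design note: each of the three terms is min-max normalized per batch by normalize_tensor before the alpha/beta/gamma weighting, which makes the weights comparable across terms but ties the loss scale to the spread of values within the batch.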
 
 def line_inference(x, boxes):
     # type: (Tensor, List[Tensor]) -> Tuple[List[Tensor], List[Tensor]]
@@ -710,12 +781,9 @@ def line_inference(x, boxes):
         points_probs.append(p_prob)
         points_scores.append(scores)
 
-
-
-
-
     return points_probs, points_scores
 
+
 def keypointrcnn_loss(keypoint_logits, proposals, gt_keypoints, keypoint_matched_idxs):
     # type: (Tensor, List[Tensor], List[Tensor], List[Tensor]) -> Tensor
     N, K, H, W = keypoint_logits.shape
@@ -843,7 +911,7 @@ def paste_mask_in_image(mask, box, im_h, im_w):
     y_0 = max(box[1], 0)
     y_1 = min(box[3] + 1, im_h)
 
-    im_mask[y_0:y_1, x_0:x_1] = mask[(y_0 - box[1]) : (y_1 - box[1]), (x_0 - box[0]) : (x_1 - box[0])]
+    im_mask[y_0:y_1, x_0:x_1] = mask[(y_0 - box[1]): (y_1 - box[1]), (x_0 - box[0]): (x_1 - box[0])]
     return im_mask
 
 
@@ -868,7 +936,7 @@ def _onnx_paste_mask_in_image(mask, box, im_h, im_w):
     y_0 = torch.max(torch.cat((box[1].unsqueeze(0), zero)))
     y_1 = torch.min(torch.cat((box[3].unsqueeze(0) + one, im_h.unsqueeze(0))))
 
-    unpaded_im_mask = mask[(y_0 - box[1]) : (y_1 - box[1]), (x_0 - box[0]) : (x_1 - box[0])]
+    unpaded_im_mask = mask[(y_0 - box[1]): (y_1 - box[1]), (x_0 - box[0]): (x_1 - box[0])]
 
     # TODO : replace below with a dynamic padding when support is added in ONNX
 
@@ -919,31 +987,31 @@ class RoIHeads(nn.Module):
     }
 
     def __init__(
-        self,
-        box_roi_pool,
-        box_head,
-        box_predictor,
-        # Faster R-CNN training
-        fg_iou_thresh,
-        bg_iou_thresh,
-        batch_size_per_image,
-        positive_fraction,
-        bbox_reg_weights,
-        # Faster R-CNN inference
-        score_thresh,
-        nms_thresh,
-        detections_per_img,
-        # Line
-        line_roi_pool=None,
-        line_head=None,
-        line_predictor=None,
-        # Mask
-        mask_roi_pool=None,
-        mask_head=None,
-        mask_predictor=None,
-        keypoint_roi_pool=None,
-        keypoint_head=None,
-        keypoint_predictor=None,
+            self,
+            box_roi_pool,
+            box_head,
+            box_predictor,
+            # Faster R-CNN training
+            fg_iou_thresh,
+            bg_iou_thresh,
+            batch_size_per_image,
+            positive_fraction,
+            bbox_reg_weights,
+            # Faster R-CNN inference
+            score_thresh,
+            nms_thresh,
+            detections_per_img,
+            # Line
+            line_roi_pool=None,
+            line_head=None,
+            line_predictor=None,
+            # Mask
+            mask_roi_pool=None,
+            mask_head=None,
+            mask_predictor=None,
+            keypoint_roi_pool=None,
+            keypoint_head=None,
+            keypoint_predictor=None,
     ):
         super().__init__()
 
@@ -978,8 +1046,8 @@ class RoIHeads(nn.Module):
         self.keypoint_predictor = keypoint_predictor
 
         self.channel_compress = nn.Sequential(
-             nn.Conv2d(256, 16, kernel_size=1),
-             nn.BatchNorm2d(16),
+            nn.Conv2d(256, 16, kernel_size=1),
+            nn.BatchNorm2d(16),
             nn.ReLU(inplace=True)
         )
 
@@ -1073,9 +1141,9 @@ class RoIHeads(nn.Module):
                 raise ValueError("Every element of targets should have a masks key")
 
     def select_training_samples(
-        self,
-        proposals,  # type: List[Tensor]
-        targets,  # type: Optional[List[Dict[str, Tensor]]]
+            self,
+            proposals,  # type: List[Tensor]
+            targets,  # type: Optional[List[Dict[str, Tensor]]]
     ):
         # type: (...) -> Tuple[List[Tensor], List[Tensor], List[Tensor], List[Tensor]]
         self.check_targets(targets)
@@ -1111,11 +1179,11 @@ class RoIHeads(nn.Module):
         return proposals, matched_idxs, labels, regression_targets
 
     def postprocess_detections(
-        self,
-        class_logits,  # type: Tensor
-        box_regression,  # type: Tensor
-        proposals,  # type: List[Tensor]
-        image_shapes,  # type: List[Tuple[int, int]]
+            self,
+            class_logits,  # type: Tensor
+            box_regression,  # type: Tensor
+            proposals,  # type: List[Tensor]
+            image_shapes,  # type: List[Tuple[int, int]]
     ):
         # type: (...) -> Tuple[List[Tensor], List[Tensor], List[Tensor]]
         device = class_logits.device
@@ -1170,11 +1238,11 @@ class RoIHeads(nn.Module):
         return all_boxes, all_scores, all_labels
 
     def forward(
-        self,
-        features,  # type: Dict[str, Tensor]
-        proposals,  # type: List[Tensor]
-        image_shapes,  # type: List[Tuple[int, int]]
-        targets=None,  # type: Optional[List[Dict[str, Tensor]]]
+            self,
+            features,  # type: Dict[str, Tensor]
+            proposals,  # type: List[Tensor]
+            image_shapes,  # type: List[Tuple[int, int]]
+            targets=None,  # type: Optional[List[Dict[str, Tensor]]]
     ):
         # type: (...) -> Tuple[List[Dict[str, Tensor]], Dict[str, Tensor]]
         """
@@ -1239,7 +1307,6 @@ class RoIHeads(nn.Module):
                     }
                 )
 
-
         if self.has_line():
             print(f'roi_heads forward has_line()!!!!')
             line_proposals = [p["boxes"] for p in result]
@@ -1281,27 +1348,23 @@ class RoIHeads(nn.Module):
 
             print(f'line_proposals:{len(line_proposals)}')
 
-
-
             # line_features = self.line_roi_pool(features, line_proposals, image_shapes)
 
-
             # print(f'line_features from line_roi_pool:{line_features.shape}')
 
-            line_features=self.channel_compress(features['0'])
-
-            line_features=lines_features_align(line_features,line_proposals,image_shapes)
+            line_features = self.channel_compress(features['0'])
 
+            line_features = lines_features_align(line_features, line_proposals, image_shapes)
 
             line_features = self.line_head(line_features)
             print(f'line_features from line_head:{line_features.shape}')
             # line_logits = self.line_predictor(line_features)
 
-            line_logits=line_features
+            line_logits = line_features
             print(f'line_logits:{line_logits.shape}')
 
             loss_line = {}
-            loss_line_iou={}
+            loss_line_iou = {}
 
             if self.training:
 
@@ -1315,7 +1378,7 @@ class RoIHeads(nn.Module):
                 rcnn_loss_line = lines_point_pair_loss(
                     line_logits, line_proposals, gt_lines, pos_matched_idxs
                 )
-                iou_loss = line_iou_loss(line_logits, line_proposals, gt_lines, pos_matched_idxs,img_size)
+                iou_loss = line_iou_loss(line_logits, line_proposals, gt_lines, pos_matched_idxs, img_size)
 
                 loss_line = {"loss_line": rcnn_loss_line}
                 loss_line_iou = {'loss_line_iou': iou_loss}
@@ -1330,8 +1393,8 @@ class RoIHeads(nn.Module):
                     )
                     loss_line = {"loss_line": rcnn_loss_lines}
 
-                    iou_loss =line_iou_loss(line_logits, line_proposals,gt_lines,pos_matched_idxs,img_size)
-                    loss_line_iou={'loss_line_iou':iou_loss}
+                    iou_loss = line_iou_loss(line_logits, line_proposals, gt_lines, pos_matched_idxs, img_size)
+                    loss_line_iou = {'loss_line_iou': iou_loss}
 
 
                 else:
@@ -1349,8 +1412,6 @@ class RoIHeads(nn.Module):
             losses.update(loss_line)
             losses.update(loss_line_iou)
 
-
-
         if self.has_mask():
             mask_proposals = [p["boxes"] for p in result]
             if self.training:
@@ -1413,8 +1474,6 @@ class RoIHeads(nn.Module):
 
             keypoint_features = self.line_roi_pool(features, keypoint_proposals, image_shapes)
 
-
-
             keypoint_features = self.line_head(keypoint_features)
             keypoint_logits = self.line_predictor(keypoint_features)