5 months ago · 51ec3b67b1
--- a/libs/vision_libs/models/detection/transform.py
+++ b/libs/vision_libs/models/detection/transform.py
@@ -201,6 +201,11 @@ class GeneralizedRCNNTransform(nn.Module):
 
															             keypoints = target["keypoints"]
														
 
															             keypoints = resize_keypoints(keypoints, (h, w), image.shape[-2:])
														
 
															             target["keypoints"] = keypoints
														
 
															+
														
 
															+        if "lines" in target:
														
 
															+            lines = target["lines"]
														
 
															+            lines = resize_keypoints(lines, (h, w), image.shape[-2:])
														
 
															+            target["lines"] = lines
														
 
															         return image, target
														
 
															     # _onnx_batch_images() is an implementation of
														
@@ -274,6 +279,11 @@ class GeneralizedRCNNTransform(nn.Module):
 
															                 keypoints = pred["keypoints"]
														
 
															                 keypoints = resize_keypoints(keypoints, im_s, o_im_s)
														
 
															                 result[i]["keypoints"] = keypoints
														
 
															+
														
 
															+            if "lines" in pred:
														
 
															+                keypoints = pred["lines"]
														
 
															+                keypoints = resize_keypoints(keypoints, im_s, o_im_s)
														
 
															+                result[i]["lines"] = keypoints
														
 
															         return result
														
 
															     def __repr__(self) -> str:
														
--- a/models/base/base_detection_net.py
+++ b/models/base/base_detection_net.py
@@ -92,6 +92,7 @@ class BaseDetectionNet(BaseModel):
 
															             original_image_sizes.append((val[0], val[1]))
														
 
															         images, targets = self.transform(images, targets)
														
 
															+        # print(f'images shape from transform:{images.tensors.shape }')
														
 
															         # Check for degenerate boxes
														
 
															         # TODO: Move this to a function
														
--- a/models/keypoint/keypoint_dataset.py
+++ b/models/keypoint/keypoint_dataset.py
@@ -202,6 +202,7 @@ def line_boxes(target):
 
															                 xmax = b[0] + 1
														
 
															             boxs.append([ymin, xmin, ymax, xmax])
														
 
															+    print(f'torch.tensor(boxs):{torch.tensor(boxs).shape},torch.tensor(keypoints):{torch.tensor(keypoints).shape}')
														
 
															     return torch.tensor(boxs), torch.tensor(keypoints)
														
 
															 if __name__ == '__main__':
														
--- a/models/line_detect/line_dataset.py
+++ b/models/line_detect/line_dataset.py
@@ -31,7 +31,10 @@ def validate_keypoints(keypoints, image_width, image_height):
 
															         if not (0 <= x < image_width and 0 <= y < image_height):
														
 
															             raise ValueError(f"Key point ({x}, {y}) is out of bounds for image size ({image_width}, {image_height})")
														
 
															+"""
														
 
															+直接读取xanlabel标注的数据集json格式
														
 
															+"""
														
 
															 class LineDataset(BaseDataset):
														
 
															     def __init__(self, dataset_path, data_type, transforms=None, dataset_type=None,img_type='rgb', target_type='pixel'):
														
 
															         super().__init__(dataset_path)
														
@@ -50,28 +53,20 @@ class LineDataset(BaseDataset):
 
															     def __getitem__(self, index) -> T_co:
														
 
															         img_path = os.path.join(self.img_path, self.imgs[index])
														
 
															-        if self.data_type == 'tiff':
														
 
															-            lbl_path = os.path.join(self.lbl_path, self.imgs[index][:-4] + 'json')
														
 
															-            # img = imageio.v3.imread(img_path).reshape(512, 512, 1)
														
 
															-            img = imageio.v3.imread(img_path)[:, :, :3]
														
 
															-            # img_3channel = np.zeros((512, 512, 3), dtype=img.dtype)
														
 
															-            # img_3channel[:, :, 2] = img[:, :, 0]
														
 
															-
														
 
															-            img_3channel=img
														
 
															-            w, h = img.shape[:2]
														
 
															-            img = torch.from_numpy(img_3channel).permute(2, 0, 1)
														
 
															-        else:
														
 
															-            lbl_path = os.path.join(self.lbl_path, self.imgs[index][:-3] + 'json')
														
 
															-            img = PIL.Image.open(img_path).convert('RGB')
														
 
															-            w, h = img.size
														
 
															+
														
 
															+        lbl_path = os.path.join(self.lbl_path, self.imgs[index][:-3] + 'json')
														
 
															+        img = PIL.Image.open(img_path).convert('RGB')
														
 
															+        w, h = img.size
														
 
															         # wire_labels, target = self.read_target(item=index, lbl_path=lbl_path, shape=(h, w))
														
 
															         target = self.read_target(item=index, lbl_path=lbl_path, shape=(h, w))
														
 
															         if self.transforms:
														
 
															             img, target = self.transforms(img, target)
														
 
															+
														
 
															         else:
														
 
															             img = self.default_transform(img)
														
 
															         # print(f'img:{img}')
														
 
															+        # print(f'img shape:{img.shape}')
														
 
															         return img, target
														
 
															     def __len__(self):
														
@@ -83,78 +78,31 @@ class LineDataset(BaseDataset):
 
															         with open(lbl_path, 'r') as file:
														
 
															             lable_all = json.load(file)
														
 
															-        n_stc_posl = 300
														
 
															-        n_stc_negl = 40
														
 
															-        use_cood = 0
														
 
															-        use_slop = 0
														
 
															-
														
 
															-        wire = lable_all["wires"][0]  # 字典
														
 
															-        line_pos_coords = np.random.permutation(wire["line_pos_coords"]["content"])[: n_stc_posl]  # 不足，有多少取多少
														
 
															-        line_neg_coords = np.random.permutation(wire["line_neg_coords"]["content"])[: n_stc_negl]
														
 
															-        npos, nneg = len(line_pos_coords), len(line_neg_coords)
														
 
															-        lpre = np.concatenate([line_pos_coords, line_neg_coords], 0)  # 正负样本坐标合在一起
														
 
															-        for i in range(len(lpre)):
														
 
															-            if random.random() > 0.5:
														
 
															-                lpre[i] = lpre[i, ::-1]
														
 
															-        ldir = lpre[:, 0, :2] - lpre[:, 1, :2]
														
 
															-        ldir /= np.clip(LA.norm(ldir, axis=1, keepdims=True), 1e-6, None)
														
 
															-        feat = [
														
 
															-            lpre[:, :, :2].reshape(-1, 4) / 128 * use_cood,
														
 
															-            ldir * use_slop,
														
 
															-            lpre[:, :, 2],
														
 
															-        ]
														
 
															-        feat = np.concatenate(feat, 1)
														
 
															-
														
 
															-        wire_labels = {
														
 
															-            "junc_coords": torch.tensor(wire["junc_coords"]["content"]),
														
 
															-            "jtyp": torch.tensor(wire["junc_coords"]["content"])[:, 2].byte(),
														
 
															-            "line_pos_idx": adjacency_matrix(len(wire["junc_coords"]["content"]), wire["line_pos_idx"]["content"]),
														
 
															-            # 真实存在线条的邻接矩阵
														
 
															-            "line_neg_idx": adjacency_matrix(len(wire["junc_coords"]["content"]), wire["line_neg_idx"]["content"]),
														
 
															-
														
 
															-            "lpre": torch.tensor(lpre)[:, :, :2],
														
 
															-            "lpre_label": torch.cat([torch.ones(npos), torch.zeros(nneg)]),  # 样本对应标签 1，0
														
 
															-            "lpre_feat": torch.from_numpy(feat),
														
 
															-            "junc_map": torch.tensor(wire['junc_map']["content"]),
														
 
															-            "junc_offset": torch.tensor(wire['junc_offset']["content"]),
														
 
															-            "line_map": torch.tensor(wire['line_map']["content"]),
														
 
															-        }
														
 
															-
														
 
															-        labels = []
														
 
															-        if self.target_type == 'polygon':
														
 
															-            labels, masks = read_masks_from_txt_wire(lbl_path, shape)
														
 
															-        elif self.target_type == 'pixel':
														
 
															-            labels = read_masks_from_pixels_wire(lbl_path, shape)
														
 
															-
														
 
															-        # print(torch.stack(masks).shape)    # [线段数, 512, 512]
														
 
															+
														
 
															+        objs = lable_all["shapes"]
														
 
															+        point_pairs=objs[0]['points']
														
 
															+
														
 
															+
														
 
															+        # print(f'point_pairs:{point_pairs}')
														
 
															         target = {}
														
 
															         target["image_id"] = torch.tensor(item)
														
 
															-        # return wire_labels, target
														
 
															-        target["wires"] = wire_labels
														
 
															-
														
 
															-        # target["labels"] = torch.stack(labels)
														
 
															-        # print(f'labels:{target["labels"]}')
														
 
															-        # target["boxes"] = line_boxes(target)
														
 
															-        target["boxes"], lines = get_boxes_lines(target)
														
 
															+        target["boxes"], lines = get_boxes_lines(objs,shape)
														
 
															+        # print(f'lines:{lines}')
														
 
															         target["labels"] = torch.ones(len(target["boxes"]), dtype=torch.int64)
														
 
															-        # keypoints=keypoints/512
														
 
															-        # visibility_flags = torch.ones((wire_labels["junc_coords"].shape[0], 1))
														
 
															-        # keypoints= wire_labels["junc_coords"]
														
 
															+
														
 
															         a = torch.full((lines.shape[0],), 2).unsqueeze(1)
														
 
															         lines = torch.cat((lines, a), dim=1)
														
 
															         target["lines"] = lines.to(torch.float32).view(-1,2,3)
														
 
															-        # print(f'boxes:{target["boxes"].shape}')
														
 
															-        # 在 __getitem__ 方法中调用此函数
														
 
															+        target["img_size"]=shape
														
 
															+
														
 
															         validate_keypoints(lines, shape[0], shape[1])
														
 
															-        # print(f'keypoints:{target["keypoints"].shape}')
														
 
															-        # print(f'target:{target}')
														
 
															         return target
														
 
															-    def show(self, idx):
														
 
															+    def show(self, idx,show_type='all'):
														
 
															         image, target = self.__getitem__(idx)
														
 
															         cmap = plt.get_cmap("jet")
														
@@ -164,12 +112,23 @@ class LineDataset(BaseDataset):
 
															         img_path = os.path.join(self.img_path, self.imgs[idx])
														
 
															         img = PIL.Image.open(img_path).convert('RGB')
														
 
															-        boxed_image = draw_bounding_boxes((self.default_transform(img) * 255).to(torch.uint8), target["boxes"],
														
 
															+        if show_type=='all':
														
 
															+            boxed_image = draw_bounding_boxes((self.default_transform(img) * 255).to(torch.uint8), target["boxes"],
														
 
															+                                                  colors="yellow", width=1)
														
 
															+            keypoint_img=draw_keypoints(boxed_image,target['lines'],colors='red',width=3)
														
 
															+            plt.imshow(keypoint_img.permute(1, 2, 0).numpy())
														
 
															+            plt.show()
														
 
															+
														
 
															+        if show_type=='lines':
														
 
															+            keypoint_img=draw_keypoints((self.default_transform(img) * 255).to(torch.uint8),target['lines'],colors='red',width=3)
														
 
															+            plt.imshow(keypoint_img.permute(1, 2, 0).numpy())
														
 
															+            plt.show()
														
 
															+
														
 
															+        if show_type=='boxes':
														
 
															+            boxed_image = draw_bounding_boxes((self.default_transform(img) * 255).to(torch.uint8), target["boxes"],
														
 
															                                               colors="yellow", width=1)
														
 
															-        keypoint_img=draw_keypoints(boxed_image,target['keypoints'],colors='red',width=3)
														
 
															-        plt.imshow(keypoint_img.permute(1, 2, 0).numpy())
														
 
															-        plt.show()
														
 
															-
														
 
															+            plt.imshow(boxed_image.permute(1, 2, 0).numpy())
														
 
															+            plt.show()
														
@@ -177,33 +136,35 @@ class LineDataset(BaseDataset):
 
															     def show_img(self, img_path):
														
 
															         pass
														
 
															-def get_boxes_lines(target):
														
 
															-    boxs = []
														
 
															-    lpre = target['wires']["lpre"].cpu().numpy()
														
 
															-    vecl_target = target['wires']["lpre_label"].cpu().numpy()
														
 
															-    lpre = lpre[vecl_target == 1]
														
 
															-    lines = lpre
														
 
															-    sline = np.ones(lpre.shape[0])
														
 
															+def get_boxes_lines(objs,shape):
														
 
															+    boxes = []
														
 
															+    h,w=shape
														
 
															     line_point_pairs = []
														
 
															-    if len(lines) > 0 and not (lines[0] == 0).all():
														
 
															-        for i, ((a, b), s) in enumerate(zip(lines, sline)):
														
 
															-            if i > 0 and (lines[i] == lines[0]).all():
														
 
															-                break
														
 
															-            # plt.plot([a[1], b[1]], [a[0], b[0]], c="red", linewidth=1)  # a[1], b[1]无明确大小
														
 
															-            line_point_pairs.append([a[1], a[0]])
														
 
															-            line_point_pairs.append([b[1], b[0]])
														
 
															+    for obj in objs:
														
 
															+        # plt.plot([a[1], b[1]], [a[0], b[0]], c="red", linewidth=1)  # a[1], b[1]无明确大小
														
 
															+
														
 
															+        # print(f"points:{obj['points']}")
														
 
															+
														
 
															+        a,b=obj['points'][0],obj['points'][1]
														
 
															+
														
 
															+        line_point_pairs.append(a)
														
 
															+        line_point_pairs.append(b)
														
 
															+
														
 
															+        xmin = max(0, (min(a[0], b[0]) - 6))
														
 
															+        xmax = min(w, (max(a[0], b[0]) + 6))
														
 
															+        ymin = max(0, (min(a[1], b[1]) - 6))
														
 
															+        ymax = min(h, (max(a[1], b[1]) + 6))
														
 
															-            xmin = max(0, (min(a[0], b[0]) - 6))
														
 
															-            xmax = min(511, (max(a[0], b[0]) + 6))
														
 
															-            ymin = max(0, (min(a[1], b[1]) - 6))
														
 
															-            ymax = min(511, (max(a[1], b[1]) + 6))
														
 
															+        boxes.append([ xmin,ymin,  xmax,ymax])
														
 
															-            boxs.append([ymin, xmin, ymax, xmax])
														
 
															+    boxes=torch.tensor(boxes)
														
 
															+    line_point_pairs=torch.tensor(line_point_pairs)
														
 
															-    return torch.tensor(boxs), torch.tensor(line_point_pairs)
														
 
															+    # print(f'boxes:{boxes.shape},line_point_pairs:{line_point_pairs.shape}')
														
 
															+    return boxes,line_point_pairs
														
 
															 if __name__ == '__main__':
														
 
															-    path=r"\\192.168.50.222/share/lm/Dataset_all"
														
 
															-    dataset= LineDataset(dataset_path=path, dataset_type='train')
														
 
															-    dataset.show(10)
														
 
															+    path=r"\\192.168.50.222/share/rlq/datasets/0706_"
														
 
															+    dataset= LineDataset(dataset_path=path, dataset_type='train',data_type='jpg')
														
 
															+    dataset.show(1,show_type='lines')
														
--- a/models/line_detect/line_detect.py
+++ b/models/line_detect/line_detect.py
@@ -35,7 +35,6 @@ from ..base.high_reso_resnet import resnet50fpn, resnet18fpn
 
															 __all__ = [
														
 
															     "LineDetect",
														
 
															-    "LineDetect_ResNet50_FPN_Weights",
														
 
															     "linedetect_resnet50_fpn",
														
 
															 ]
														
@@ -54,7 +53,7 @@ class LineDetect(BaseDetectionNet):
 
															             num_classes=None,
														
 
															             # transform parameters
														
 
															             min_size=512,
														
 
															-            max_size=1333,
														
 
															+            max_size=2048,
														
 
															             image_mean=None,
														
 
															             image_std=None,
														
 
															             # RPN parameters
														
--- a/models/line_detect/loi_heads.py
+++ b/models/line_detect/loi_heads.py
@@ -176,7 +176,7 @@ def line_points_to_heatmap(keypoints, rois, heatmap_size):
 
															     # show_heatmap(gs_heatmap[0],'feature')
														
 
															-    print(f'gs_heatmap:{gs_heatmap.shape}')
														
 
															+    # print(f'gs_heatmap:{gs_heatmap.shape}')
														
 
															     #
														
 
															     # lin_ind = y * heatmap_size + x
														
 
															     # print(f'lin_ind:{lin_ind.shape}')
														
@@ -622,8 +622,9 @@ def line_iou_loss(x, boxes, gt_lines, matched_idx, img_size=511):
 
															         loss = 1.0 - ious
														
 
															         losses.append(loss)
														
 
															-    if not losses:
														
 
															-        return None
														
 
															+    if not losses:  # 如果损失列表为空，则返回默认值或抛出自定义异常
														
 
															+        print("Warning: No valid losses were computed.")
														
 
															+        return torch.tensor(1, requires_grad=True).to(x.device)  # 返回一个标量张量
														
 
															     total_loss = torch.mean(torch.cat(losses))
														
 
															     return total_loss
														
@@ -1219,12 +1220,15 @@ class RoIHeads(nn.Module):
 
															             loss_line = {}
														
 
															             loss_line_iou={}
														
 
															-            img_size=512
														
 
															+
														
 
															             if self.training:
														
 
															+
														
 
															                 if targets is None or pos_matched_idxs is None:
														
 
															                     raise ValueError("both targets and pos_matched_idxs should not be None when in training mode")
														
 
															                 gt_lines = [t["lines"] for t in targets]
														
 
															+                h, w = targets[0]["img_size"]
														
 
															+                img_size = h
														
 
															                 rcnn_loss_line = lines_point_pair_loss(
														
 
															                     line_logits, line_proposals, gt_lines, pos_matched_idxs
														
 
															                 )
														
@@ -1235,6 +1239,8 @@ class RoIHeads(nn.Module):
 
															             else:
														
 
															                 if targets is not None:
														
 
															+                    h, w = targets[0]["img_size"]
														
 
															+                    img_size = h
														
 
															                     gt_lines = [t["lines"] for t in targets]
														
 
															                     rcnn_loss_lines = lines_point_pair_loss(
														
 
															                         line_logits, line_proposals, gt_lines, pos_matched_idxs
														
--- a/models/line_detect/train.yaml
+++ b/models/line_detect/train.yaml
@@ -1,7 +1,7 @@
 
															 io:
														
 
															   logdir: train_results
														
 
															-  datadir: /data/share/zyh/202507/a_dataset
														
 
															-  data_type: jpg
														
 
															+  datadir: \\192.168.50.222/share/rlq/datasets/0706_
														
 
															+  data_type: tiff
														
 
															 #  datadir: D:\python\PycharmProjects\data_20250223\0423_
														
 
															 #  datadir: I:\datasets\wirenet_1000
														
--- a/models/line_detect/train_demo.py
+++ b/models/line_detect/train_demo.py
@@ -15,8 +15,7 @@ if __name__ == '__main__':
 
															     # model=linenet_newresnet50fpn()
														
 
															     # model = lineDetect_resnet18_fpn()
														
 
															-    # model=linedetect_resnet18_fpn()
														
 
															-    model=linedetect_newresnet18fpn()
														
 
															-    model.load_weights(r'/home/admin/projects/MultiVisionModels/models/line_detect/train_results/20250706_150832/weights/best_val.pth')
														
 
															+    model=linedetect_resnet18_fpn()
														
 
															+    # model=linedetect_newresnet18fpn()
														
 
															     model.start_train(cfg='train.yaml')
														
--- a/models/line_detect/trainer.py
+++ b/models/line_detect/trainer.py
@@ -5,7 +5,7 @@ from datetime import datetime
 
															 import numpy as np
														
 
															 import torch
														
 
															 from matplotlib import pyplot as plt
														
 
															-from torch.optim.lr_scheduler import StepLR, ReduceLROnPlateau
														
 
															+from torch.optim.lr_scheduler import ReduceLROnPlateau
														
 
															 from torch.utils.tensorboard import SummaryWriter
														
 
															 from libs.vision_libs.utils import draw_bounding_boxes, draw_keypoints
														
@@ -274,9 +274,9 @@ class Trainer(BaseTrainer):
 
															         for epoch in range(self.max_epoch):
														
 
															             print(f"train epoch:{epoch}")
														
 
															-
														
 
															             model, epoch_train_loss = self.one_epoch(model, data_loader_train, epoch, optimizer)
														
 
															             scheduler.step(epoch_train_loss)
														
 
															+
														
 
															             # ========== Validation ==========
														
 
															             with torch.no_grad():
														
 
															                 model, epoch_val_loss = self.one_epoch(model, data_loader_val, epoch, optimizer, phase='val')
														
@@ -286,6 +286,7 @@ class Trainer(BaseTrainer):
 
															                 best_train_loss = epoch_train_loss
														
 
															                 best_val_loss = epoch_val_loss
														
 
															+
														
 
															             self.save_last_model(model,self.last_model_path, epoch, optimizer)
														
 
															             best_train_loss = self.save_best_model(model, self.best_train_model_path, epoch, epoch_train_loss,
														
 
															                                                    best_train_loss,
														
@@ -293,9 +294,6 @@ class Trainer(BaseTrainer):
 
															             best_val_loss = self.save_best_model(model, self.best_val_model_path, epoch, epoch_val_loss, best_val_loss,
														
 
															                                                  optimizer)
														
 
															-
														
 
															-
														
 
															-
														
 
															     def one_epoch(self, model, data_loader, epoch, optimizer, phase='train'):
														
 
															         if phase == 'train':
														
 
															             model.train()
														
@@ -331,7 +329,7 @@ class Trainer(BaseTrainer):
 
															                 t_start = time.time()
														
 
															                 print(f'start to predict:{t_start}')
														
 
															                 result = model(self.move_to_device(imgs, self.device))
														
 
															-                # print(f'result:{result}')
														
 
															+                print(f'result:{result}')
														
 
															                 t_end = time.time()
														
 
															                 print(f'predict used:{t_end - t_start}')
														
 
															                 self.writer_predict_result(img=imgs[0], result=result[0], epoch=epoch)