5 months ago · e0a7d535e4
--- a/libs/vision_libs/models/detection/rpn.py
+++ b/libs/vision_libs/models/detection/rpn.py
@@ -357,7 +357,9 @@ class RegionProposalNetwork(torch.nn.Module):
 
															         """
														
 
															         # RPN uses all feature maps that are available
														
 
															         features = list(features.values())
														
 
															+
														
 
															         objectness, pred_bbox_deltas = self.head(features)
														
 
															+
														
 
															         anchors = self.anchor_generator(images, features)
														
 
															         num_images = len(anchors)
														
@@ -385,4 +387,5 @@ class RegionProposalNetwork(torch.nn.Module):
 
															                 "loss_objectness": loss_objectness,
														
 
															                 "loss_rpn_box_reg": loss_rpn_box_reg,
														
 
															             }
														
 
															+        # print(f'boxes:{boxes[0].shape}')
														
 
															         return boxes, losses
														
--- a/models/base/base_detection_net.py
+++ b/models/base/base_detection_net.py
@@ -114,6 +114,11 @@ class BaseDetectionNet(BaseModel):
 
															             features = OrderedDict([("0", features)])
														
 
															         proposals, proposal_losses = self.rpn(images, features, targets)
														
 
															+
														
 
															+        # print(f'proposals:{proposals[0].shape}')
														
 
															+
														
 
															+
														
 
															+
														
 
															         detections, detector_losses = self.roi_heads(features, proposals, images.image_sizes, targets)
														
 
															         detections = self.transform.postprocess(detections, images.image_sizes, original_image_sizes)  # type: ignore[operator]
														
--- a/models/base/high_reso_resnet.py
+++ b/models/base/high_reso_resnet.py
@@ -88,8 +88,29 @@ class Bottleneck(nn.Module):
 
															 # ResNet 主类
														
 
															 # ----------------------------
														
 
															+def resnet18fpn(out_channels=256):
														
 
															+    backbone = ResNet(Bottleneck,[2,2,2])
														
 
															+    return_layers = {
														
 
															+        'encoder0': '0',
														
 
															+        'encoder1': '1',
														
 
															+        'encoder2': '2',
														
 
															+        'encoder3': '3',
														
 
															+        # 'encoder4': '5'
														
 
															+    }
														
 
															+
														
 
															+    # in_channels_list = [self.inplanes, 64, 128, 256, 512]
														
 
															+    # in_channels_list = [64, 256, 512, 1024, 2048]
														
 
															+    in_channels_list = [64, 256, 512, 1024]
														
 
															+
														
 
															+    return BackboneWithFPN(
														
 
															+        backbone,
														
 
															+        return_layers=return_layers,
														
 
															+        in_channels_list=in_channels_list,
														
 
															+        out_channels=out_channels,
														
 
															+    )
														
 
															+
														
 
															 def resnet50fpn(out_channels=256):
														
 
															-    backbone = ResNet(Bottleneck)
														
 
															+    backbone = ResNet(Bottleneck,[3,4,6])
														
 
															     return_layers = {
														
 
															         'encoder0': '0',
														
 
															         'encoder1': '1',
														
@@ -111,7 +132,7 @@ def resnet50fpn(out_channels=256):
 
															 class ResNet(nn.Module):
														
 
															-    def __init__(self, block: Type[Union[Bottleneck]],):
														
 
															+    def __init__(self, block: Type[Union[Bottleneck]], layers: List[int],):
														
 
															         super(ResNet, self).__init__()
														
 
															         self._norm_layer = nn.BatchNorm2d
														
 
															         self.inplanes = 64
														
@@ -126,9 +147,9 @@ class ResNet(nn.Module):
 
															             nn.ReLU(inplace=True),
														
 
															             nn.MaxPool2d(kernel_size=3, stride=1, padding=1)
														
 
															         )
														
 
															-        self.encoder1 = self._make_layer(block, 64, 3,stride=2)
														
 
															-        self.encoder2 = self._make_layer(block, 128, 4, stride=2)
														
 
															-        self.encoder3 = self._make_layer(block, 256, 6, stride=2)
														
 
															+        self.encoder1 = self._make_layer(block, 64, layers[0],stride=2)
														
 
															+        self.encoder2 = self._make_layer(block, 128, layers[1], stride=2)
														
 
															+        self.encoder3 = self._make_layer(block, 256, layers[2], stride=2)
														
 
															         # self.encoder4 = self._make_layer(block, 512, 3, stride=2)
														
 
															         # self.encoder5 = self._make_layer(block, 512, 3, stride=2)
														
 
															         # self.body = nn.ModuleDict({
														
@@ -253,7 +274,7 @@ if __name__ == "__main__":
 
															     input_tensor = torch.randn(1, 3, 512, 512).to(device)
														
 
															     output_tensor = model(input_tensor)
														
 
															-    backbone = ResNet(Bottleneck).to(device)
														
 
															+    backbone = ResNet(Bottleneck,[3,4,6]).to(device)
														
 
															     features = backbone(input_tensor)
														
 
															     print("Raw backbone output:", list(features.keys()))
														
 
															     print(f"Input shape: {input_tensor.shape}")
														
--- a/models/line_detect/line_net.py
+++ b/models/line_detect/line_net.py
@@ -34,7 +34,7 @@ from ..base.base_detection_net import BaseDetectionNet
 
															 import torch.nn.functional as F
														
 
															 from .predict import Predict1, Predict
														
 
															-from ..base.resnet50fpn import resnet50fpn
														
 
															+from ..base.high_reso_resnet import resnet50fpn, resnet18fpn
														
 
															 from ..config.config_tool import read_yaml
														
@@ -526,8 +526,60 @@ class LineNet_MobileNet_V3_Large_320_FPN_Weights(WeightsEnum):
 
															         },
														
 
															     )
														
 
															     DEFAULT = COCO_V1
														
 
															+def linenet_newresnet18fpn(
														
 
															+        *,
														
 
															+        weights: Optional[LineNet_ResNet50_FPN_Weights] = None,
														
 
															+        progress: bool = True,
														
 
															+        num_classes: Optional[int] = None,
														
 
															+        weights_backbone: Optional[ResNet18_Weights] = ResNet18_Weights.IMAGENET1K_V1,
														
 
															+        trainable_backbone_layers: Optional[int] = None,
														
 
															+        **kwargs: Any,
														
 
															+) -> LineNet:
														
 
															+    # weights = LineNet_ResNet50_FPN_Weights.verify(weights)
														
 
															+    # weights_backbone = ResNet50_Weights.verify(weights_backbone)
														
 
															+
														
 
															+    if weights is not None:
														
 
															+        weights_backbone = None
														
 
															+        num_classes = _ovewrite_value_param("num_classes", num_classes, len(weights.meta["categories"]))
														
 
															+    elif num_classes is None:
														
 
															+        num_classes = 91
														
 
															+    if weights_backbone is not None:
														
 
															+        print(f'resnet50 weights is not None')
														
 
															+
														
 
															+    is_trained = weights is not None or weights_backbone is not None
														
 
															+    trainable_backbone_layers = _validate_trainable_layers(is_trained, trainable_backbone_layers, 5, 3)
														
 
															+    norm_layer = misc_nn_ops.FrozenBatchNorm2d if is_trained else nn.BatchNorm2d
														
 
															+
														
 
															+    backbone =resnet18fpn()
														
 
															+    featmap_names=['0', '1', '2', '3','pool']
														
 
															+    # print(f'featmap_names:{featmap_names}')
														
 
															+    roi_pooler = MultiScaleRoIAlign(
														
 
															+        featmap_names=featmap_names,
														
 
															+        output_size=7,
														
 
															+        sampling_ratio=2
														
 
															+    )
														
 
															+    num_features=len(featmap_names)
														
 
															+    anchor_sizes = tuple((int(16 * 2 ** i),) for i in range(num_features))  # 自动生成不同大小
														
 
															+    # print(f'anchor_sizes:{anchor_sizes}')
														
 
															+    aspect_ratios = ((0.5, 1.0, 2.0),) * num_features
														
 
															+    # print(f'aspect_ratios:{aspect_ratios}')
														
 
															+    anchor_generator =  AnchorGenerator(sizes=anchor_sizes, aspect_ratios=aspect_ratios)
														
 
															+    # anchors = anchor_generator.generate_anchors()
														
 
															+    # print("Number of anchor sizes:", len(anchor_generator.sizes))  # 应为 5
														
 
															+    model = LineNet(backbone, num_classes=num_classes,anchor_generator=anchor_generator,
														
 
															+
														
 
															+                    box_roi_pool=roi_pooler,
														
 
															+                    **kwargs)
														
 
															+
														
 
															+    if weights is not None:
														
 
															+        model.load_state_dict(weights.get_state_dict(progress=progress, check_hash=True))
														
 
															+        if weights == LineNet_ResNet50_FPN_Weights.COCO_V1:
														
 
															+            overwrite_eps(model, 0.0)
														
 
															+
														
 
															+    return model
														
 
															+
														
 
															 def linenet_newresnet50fpn(
														
 
															         *,
														
 
															         weights: Optional[LineNet_ResNet50_FPN_Weights] = None,
														
--- a/models/line_detect/line_predictor.py
+++ b/models/line_detect/line_predictor.py
@@ -106,11 +106,11 @@ class LineRCNNPredictor(nn.Module):
 
															         else:
														
 
															             self.pooling = nn.MaxPool1d(scale_factor, scale_factor)
														
 
															             self.fc2 = nn.Sequential(
														
 
															-                nn.Linear(self.dim_loi * self.n_pts1 + FEATURE_DIM, self.dim_fc*16),
														
 
															+                nn.Linear(self.dim_loi * self.n_pts1 + FEATURE_DIM, self.dim_fc*2),
														
 
															                 nn.ReLU(inplace=True),
														
 
															-                nn.Linear(self.dim_fc*16, self.dim_fc*8),
														
 
															+                nn.Linear(self.dim_fc*2, self.dim_fc*2),
														
 
															                 nn.ReLU(inplace=True),
														
 
															-                nn.Linear(self.dim_fc*8, 1),
														
 
															+                nn.Linear(self.dim_fc*2, 1),
														
 
															             )
														
 
															         self.loss = nn.BCEWithLogitsLoss(reduction="none")
														
--- a/models/line_detect/train.yaml
+++ b/models/line_detect/train.yaml
@@ -1,6 +1,6 @@
 
															 io:
														
 
															   logdir: train_results
														
 
															-  datadir: /data/share/lm/Dataset_all
														
 
															+  datadir: \\192.168.50.222/share/lm/Dataset_all
														
 
															 #  datadir: D:\python\PycharmProjects\data_20250223\0423_
														
 
															 #  datadir: I:\datasets\wirenet_1000
														
--- a/models/line_detect/train_demo.py
+++ b/models/line_detect/train_demo.py
@@ -1,7 +1,7 @@
 
															 import torch
														
 
															 from models.line_detect.line_net import linenet_resnet50_fpn, LineNet, linenet_resnet18_fpn, linenet_newresnet50fpn, \
														
 
															-    get_line_net_convnext_fpn
														
 
															+    get_line_net_convnext_fpn, linenet_newresnet18fpn
														
 
															 from models.line_detect.trainer import Trainer
														
 
															 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
														
@@ -11,8 +11,9 @@ if __name__ == '__main__':
 
															     # model=linenet_resnet50_fpn()
														
 
															     # model = linenet_resnet18_fpn()
														
 
															     # model=get_line_net_convnext_fpn(num_classes=2).to(device)
														
 
															-    model=linenet_newresnet50fpn()
														
 
															-    # model.load_best_model('train_results/20250622_143530/weights/best_val.pth')
														
 
															+    # model=linenet_newresnet50fpn()
														
 
															+    model = linenet_newresnet18fpn()
														
 
															+    model.load_best_model('train_results/20250622_140412/weights/best_val.pth')
														
 
															     # trainer = Trainer()
														
 
															     # trainer.train_cfg(model,cfg='./train.yaml')
														
 
															     model.start_train(cfg='train.yaml')