@@ -1,9 +1,9 @@
 # ??roi_head??????????????
-from torch import dtype
 from torch.utils.data.dataset import T_co
+from libs.vision_libs.models.detection import MaskRCNN_ResNet50_FPN_V2_Weights
 from models.base.base_dataset import BaseDataset
-
+from torchvision.transforms import functional as F
 import glob
 import json
 import math
@@ -70,6 +70,7 @@ class WirePointDataset(BaseDataset):
         self.imgs = os.listdir(self.img_path)
         self.lbls = os.listdir(self.lbl_path)
         self.target_type = target_type
+        self.transform = MaskRCNN_ResNet50_FPN_V2_Weights.DEFAULT.transforms()
         # self.default_transform = DefaultTransform()

     def __getitem__(self, index) -> T_co:
@@ -77,35 +78,61 @@ class WirePointDataset(BaseDataset):
         lbl_path = os.path.join(self.lbl_path, self.imgs[index][:-3] + 'json')

         # img = PIL.Image.open(img_path).convert('RGB')
-        # w, h = img.size
         img = cv2.imread(img_path, cv2.IMREAD_UNCHANGED)
-        print(img.shape)
-        w, h = img.shape[0:2]
+        img_rgb = img[:, :, :3]
+        print(f'img shape:{img.shape}')
+        img_rgb = cv2.cvtColor(img_rgb, cv2.COLOR_BGR2RGB)
+        # img = np.array(img, copy=True)
+        # img = self.default_transform(img)
+        # print(f'pil img:{img.dtype}')
+        # w, h = img.size
+        # img = cv2.imread(img_path, cv2.IMREAD_UNCHANGED)
+        # cv2.imshow('img', img)
+        # cv2.waitKey(1000000)
+        # print(img.shape)
+        w, h = img.shape[0:2]
+        # w, h = img.size
         # wire_labels, target = self.read_target(item=index, lbl_path=lbl_path, shape=(h, w))
         target = self.read_target(item=index, lbl_path=lbl_path, shape=(h, w))
+
+        print(f'self.default_transform:{self.default_transform}')
+
         # if self.transforms:
         #     img, target = self.transforms(img, target)
         # else:
         #     img = self.default_transform(img)

-        # Split the RGB and depth channels
-        rgb_channels = img[:, :, :3]
-        depth_channel = img[:, :, 3]
-
-        # rgb_normalized = rgb_channels.astype(np.float32) / 255.0
-        rgb_normalized = rgb_channels
-        depth_normalized = (depth_channel - depth_channel.min()) / (depth_channel.max() - depth_channel.min()) * 255
-
-        # Recombine the normalized RGB and depth channels
-        normalized_rgba_image = np.dstack((rgb_normalized, depth_normalized))  # or use depth_normalized_fixed_range
+        # # Split the RGB and depth channels
+        # rgb_channels = img[:, :, :3]
+        # depth_channel = img[:, :, 3]
+        #
+        # rgb_normalized = rgb_channels / 255
+        # depth_normalized = (depth_channel - depth_channel.min()) / (depth_channel.max() - depth_channel.min()) * 255
+        #
+        # # Recombine the normalized RGB and depth channels
+        # normalized_rgba_image = np.dstack((rgb_normalized, depth_normalized))  # or use depth_normalized_fixed_range
+        #
+        # print("Normalized RGBA image shape:", normalized_rgba_image.shape)
+        #
+        # img = torch.tensor(normalized_rgba_image, dtype=torch.uint8).permute(2, 1, 0)

-        print("Normalized RGBA image shape:", normalized_rgba_image.shape)
-
-        img = torch.tensor(normalized_rgba_image, dtype=torch.float32).permute(2, 1, 0)
+        # cv2.imshow('img', img[:3].permute(1, 2, 0).numpy().astype(np.uint8))
+        # cv2.waitKey(10000000)
+        # plt.imshow(img[:3].permute(1, 2, 0).numpy())
+        # plt.show()

         # new_channel = torch.zeros(1, 512, 512)
         # img = torch.cat((img, new_channel), dim=0)
+        img = np.dstack((img_rgb, img[:, :, 3]))
+
+        img = torch.as_tensor(img).permute(2, 0, 1)
+        img = self.default_transform(img)
+
+        # img = F.convert_image_dtype(img, torch.float)
         print(f'img:{img.shape}')
         # print(f'img dtype:{img.dtype}')
         return img, target
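
The new self.transform attribute comes from the Mask R-CNN weight enum's preprocessing preset. Below is a minimal sketch of what that call returns and how it is applied, assuming the vendored libs.vision_libs package mirrors the upstream torchvision API; in upstream torchvision the detection preset essentially converts a uint8 image tensor to float32 and rescales it to [0, 1].

import torch
from torchvision.models.detection import MaskRCNN_ResNet50_FPN_V2_Weights

weights = MaskRCNN_ResNet50_FPN_V2_Weights.DEFAULT
preprocess = weights.transforms()  # detection preprocessing preset bundled with the weights

# Placeholder CxHxW uint8 image standing in for a dataset sample.
img_uint8 = torch.randint(0, 256, (3, 512, 512), dtype=torch.uint8)
img_float = preprocess(img_uint8)  # float32, values scaled to [0, 1]
print(img_float.dtype, img_float.shape)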
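
The rewritten __getitem__ reads a 4-channel image with OpenCV, converts the first three channels from BGR to RGB, re-attaches the depth channel, and permutes to CxHxW. The sketch below condenses that flow into one self-contained helper, assuming a 4-channel (BGR + depth) image on disk; the name load_rgbd_tensor is illustrative, not part of the codebase.

import cv2
import numpy as np
import torch

def load_rgbd_tensor(img_path: str) -> torch.Tensor:
    """Illustrative helper: read a BGR+depth image and return a 4xHxW tensor."""
    img = cv2.imread(img_path, cv2.IMREAD_UNCHANGED)       # HxWx4 array
    rgb = cv2.cvtColor(img[:, :, :3], cv2.COLOR_BGR2RGB)   # reorder colour channels
    rgbd = np.dstack((rgb, img[:, :, 3]))                  # stack depth back as channel 4
    return torch.as_tensor(rgbd).permute(2, 0, 1)          # HxWxC -> CxHxW

Note that if the depth channel is stored in a wider dtype than the colour channels (e.g. uint16), np.dstack promotes the whole array to that dtype, so any later float conversion should account for the larger value range.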