123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293 |
- import time
- from models.line_detect.postprocess import show_predict
- import os
- import torch
- from PIL import Image
- import matplotlib.pyplot as plt
- import matplotlib as mpl
- import numpy as np
- from models.line_detect.line_net import linenet_resnet50_fpn
- from torchvision import transforms
- # from models.wirenet.postprocess import postprocess
- from models.wirenet.postprocess import postprocess
- device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
def load_best_model(model, save_path, device):
    """Load saved weights into ``model`` if a checkpoint file exists.

    The checkpoint is read with ``torch.load(..., map_location=device)`` and its
    ``'model_state_dict'`` entry is applied to ``model``. Optimizer state is not
    restored.

    Args:
        model: Module whose ``load_state_dict`` receives the saved weights.
        save_path: Path of the checkpoint file.
        device: Forwarded to ``torch.load`` as ``map_location``.

    Returns:
        The same ``model`` object. It is returned unchanged (after printing a
        notice) when ``save_path`` does not exist.

    Raises:
        KeyError: If the checkpoint has no ``'model_state_dict'`` entry.
    """
    if not os.path.exists(save_path):
        # Best-effort: a missing checkpoint is reported, not treated as an error.
        print(f"No saved model found at {save_path}")
        return model

    checkpoint = torch.load(save_path, map_location=device)
    model.load_state_dict(checkpoint['model_state_dict'])

    # 'epoch' and 'loss' are only used for the log line, so a checkpoint that
    # lacks them must not fail after the weights were loaded successfully.
    epoch = checkpoint.get('epoch')
    loss = checkpoint.get('loss')
    if epoch is None or loss is None:
        print(f"Loaded best model from {save_path}")
    else:
        print(f"Loaded best model from {save_path} at epoch {epoch} with loss {loss:.4f}")
    return model
def box_line_(pred):
    """Attach the best-scoring contained line to every detected box.

    ``pred[:-1]`` are per-image detection dicts holding ``'boxes'``; ``pred[-1]``
    holds ``['wires']['lines']`` and ``['wires']['score']``, indexed by image.
    For each box, the line with the highest strictly positive score whose two
    endpoints both lie inside the box is selected (first one wins on ties).
    A box with no such line gets an all-zero line and a score of 0.

    Endpoint index 1 is compared against box columns 0 and 2, and endpoint
    index 0 against box columns 1 and 3 -- presumably endpoints are ``(y, x)``
    and boxes ``(x1, y1, x2, y2)``; confirm against the model output.

    Args:
        pred: Model output list as described above. It is modified in place.

    Returns:
        The same ``pred`` list, where each detection dict gained:
        ``'line'``: CPU tensor of shape ``(num_boxes, 2, 2)``;
        ``'line_score'``: CPU tensor of shape ``(num_boxes,)``.
    """
    wires = pred[-1]['wires']
    for idx, detection in enumerate(pred[:-1]):
        # Move everything to host memory once; comparing tensor elements one by
        # one in Python forces a tensor->bool conversion per comparison.
        boxes = torch.as_tensor(detection['boxes']).detach().cpu().numpy()
        # Rescale line coordinates by 512 / 128 (presumably from the line
        # map resolution to the input image resolution -- TODO confirm).
        lines = torch.as_tensor(wires['lines'][idx]).detach().cpu().numpy() / 128 * 512
        scores = torch.as_tensor(wires['score'][idx]).detach().cpu().numpy()[:len(lines)]

        # Pre-sized outputs keep a well-defined shape even when there are no
        # boxes, and default to "no line found" (zeros).
        best_lines = np.zeros((len(boxes), 2, 2), dtype=lines.dtype)
        best_scores = np.zeros(len(boxes), dtype=np.result_type(scores.dtype, np.float32))

        if len(lines) > 0:
            first_coord = lines[:, :2, 0]   # compared against box columns 1 and 3
            second_coord = lines[:, :2, 1]  # compared against box columns 0 and 2
            positive = scores > 0           # only strictly positive scores can win
            for row, box in enumerate(boxes):
                lo_a, lo_b, hi_a, hi_b = box[:4]
                inside = (
                    (second_coord >= lo_a) & (second_coord <= hi_a)
                    & (first_coord >= lo_b) & (first_coord <= hi_b)
                ).all(axis=1)
                candidates = np.where(inside & positive, scores, -np.inf)
                # np.argmax returns the first maximum, matching a scan that only
                # replaces the current best on a strictly greater score.
                winner = int(np.argmax(candidates))
                if candidates[winner] > 0:
                    best_lines[row] = lines[winner]
                    best_scores[row] = scores[winner]

        detection['line'] = torch.from_numpy(best_lines)
        detection['line_score'] = torch.from_numpy(best_scores)
    return pred
def predict(pt_path, model, img, t_start=None):
    """Load weights, run the model on one image, and show the prediction.

    Args:
        pt_path: Checkpoint path handed to ``load_best_model``.
        model: Network that receives the weights; it is switched to eval mode.
        img: Either a filesystem path (``str`` or ``os.PathLike``), which is
            opened with PIL and converted to RGB, or an already-loaded image
            accepted by ``transforms.ToTensor``.
        t_start: Timestamp forwarded to ``show_predict``. When omitted, the
            module-level ``t_start`` set by the script entry point is used if
            present; otherwise the time at which this call started.
    """
    if t_start is None:
        # Previously this function read a global that only exists when the file
        # runs as a script, so importing callers hit a NameError.
        call_started = time.time()
        t_start = globals().get('t_start')
        if t_start is None:
            t_start = call_started

    model = load_best_model(model, pt_path, device)
    model.eval()

    if isinstance(img, (str, os.PathLike)):
        # convert() returns an independent, fully loaded image, so the file
        # handle can be closed as soon as the conversion is done.
        with Image.open(img) as image_file:
            img = image_file.convert("RGB")

    img_tensor = transforms.ToTensor()(img)

    # Inference only: no gradients are needed.
    with torch.no_grad():
        predictions = model([img_tensor.to(device)])

    pred = box_line_(predictions)
    show_predict(img_tensor, pred, t_start)
if __name__ == '__main__':
    # Script entry point: build the network, run one prediction, report timing.
    # t_start is a module-level name on purpose; predict() forwards it to
    # show_predict().
    t_start = time.time()
    print(f'start to predict:{t_start}')

    model = linenet_resnet50_fpn().to(device)

    # Raw strings keep the Windows backslashes literal; a plain or f-string here
    # contains invalid escape sequences such as "\p" and "\d".
    pt_path = r'D:\python\PycharmProjects\lcnn-master\lcnn_\20250212\MultiVisionModels\models\line_detect\linenet_wts\resnet50_best_e8.pth'
    img_path = r'D:\python\PycharmProjects\data2\images/train/2024-11-27-15-41-38_SaveImage.png'  # workpiece image
    # Alternative input (wireframe image):
    # img_path = r'D:\python\PycharmProjects\data\images/train/00558656_3.png'

    predict(pt_path, model, img_path)

    t_end = time.time()
    print(f'predict used:{t_end - t_start}')
|