lstlm
/
pokouqiege


			
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716
							from typing import Dict, List, Optional, Tuple

import matplotlib.pyplot as plt
import torch
import torch.nn.functional as F
import torchvision
# from scipy.optimize import linear_sum_assignment
from torch import nn, Tensor
from libs.vision_libs.ops import boxes as box_ops, roi_align

import libs.vision_libs.models.detection._utils as det_utils

from collections import OrderedDict

from models.line_detect.heads.head_losses import point_inference, compute_point_loss, line_iou_loss, \
    lines_point_pair_loss, features_align, line_inference, compute_mask_loss, arc_inference, compute_circle_loss, \
    circle_inference


def fastrcnn_loss(class_logits, box_regression, labels, regression_targets):
    # type: (Tensor, Tensor, List[Tensor], List[Tensor]) -> Tuple[Tensor, Tensor]
    """
    Computes the loss for Faster R-CNN.

    Args:
        class_logits (Tensor)
        box_regression (Tensor)
        labels (list[BoxList])
        regression_targets (Tensor)

    Returns:
        classification_loss (Tensor)
        box_loss (Tensor)
    """
    # print(f'compute fastrcnn_loss:{labels}')
    labels = torch.cat(labels, dim=0)
    regression_targets = torch.cat(regression_targets, dim=0)

    classification_loss = F.cross_entropy(class_logits, labels)

    # get indices that correspond to the regression targets for
    # the corresponding ground truth labels, to be used with
    # advanced indexing
    sampled_pos_inds_subset = torch.where(labels > 0)[0]
    labels_pos = labels[sampled_pos_inds_subset]
    N, num_classes = class_logits.shape
    box_regression = box_regression.reshape(N, box_regression.size(-1) // 4, 4)

    box_loss = F.smooth_l1_loss(
        box_regression[sampled_pos_inds_subset, labels_pos],
        regression_targets[sampled_pos_inds_subset],
        beta=1 / 9,
        reduction="sum",
    )
    box_loss = box_loss / labels.numel()

    return classification_loss, box_loss


def maskrcnn_inference(x, labels):
    # type: (Tensor, List[Tensor]) -> List[Tensor]
    """
    From the results of the CNN, post process the masks
    by taking the ins corresponding to the class with max
    probability (which are of fixed size and directly output
    by the CNN) and return the masks in the ins field of the BoxList.

    Args:
        x (Tensor): the ins logits
        labels (list[BoxList]): bounding boxes that are used as
            reference, one for ech image

    Returns:
        results (list[BoxList]): one BoxList for each image, containing
            the extra field ins
    """
    mask_prob = x.sigmoid()


    # select masks corresponding to the predicted classes
    num_masks = x.shape[0]
    boxes_per_image = [label.shape[0] for label in labels]
    labels = torch.cat(labels)
    index = torch.arange(num_masks, device=labels.device)
    mask_prob = mask_prob[index, labels][:, None]
    mask_prob = mask_prob.split(boxes_per_image, dim=0)


    return mask_prob


def project_masks_on_boxes(gt_masks, boxes, matched_idxs, M):
    # type: (Tensor, Tensor, Tensor, int) -> Tensor
    """
    Given segmentation masks and the bounding boxes corresponding
    to the location of the masks in the image, this function
    crops and resizes the masks in the position defined by the
    boxes. This prepares the masks for them to be fed to the
    loss computation as the targets.
    """
    matched_idxs = matched_idxs.to(boxes)
    rois = torch.cat([matched_idxs[:, None], boxes], dim=1)
    gt_masks = gt_masks[:, None].to(rois)
    return roi_align(gt_masks, rois, (M, M), 1.0)[:, 0]


def maskrcnn_loss(mask_logits, proposals, gt_masks, gt_labels, mask_matched_idxs):
    # type: (Tensor, List[Tensor], List[Tensor], List[Tensor], List[Tensor]) -> Tensor
    """
    Args:
        proposals (list[BoxList])
        mask_logits (Tensor)
        targets (list[BoxList])

    Return:
        mask_loss (Tensor): scalar tensor containing the loss
    """

    discretization_size = mask_logits.shape[-1]
    labels = [gt_label[idxs] for gt_label, idxs in zip(gt_labels, mask_matched_idxs)]
    mask_targets = [
        project_masks_on_boxes(m, p, i, discretization_size) for m, p, i in zip(gt_masks, proposals, mask_matched_idxs)
    ]

    labels = torch.cat(labels, dim=0)
    mask_targets = torch.cat(mask_targets, dim=0)

    # torch.mean (in binary_cross_entropy_with_logits) doesn't
    # accept empty tensors, so handle it separately
    if mask_targets.numel() == 0:
        return mask_logits.sum() * 0

    mask_loss = F.binary_cross_entropy_with_logits(
        mask_logits[torch.arange(labels.shape[0], device=labels.device), labels], mask_targets
    )
    return mask_loss


def keypoints_to_heatmap(keypoints, rois, heatmap_size):
    # type: (Tensor, Tensor, int) -> Tuple[Tensor, Tensor]
    offset_x = rois[:, 0]
    offset_y = rois[:, 1]
    scale_x = heatmap_size / (rois[:, 2] - rois[:, 0])
    scale_y = heatmap_size / (rois[:, 3] - rois[:, 1])

    offset_x = offset_x[:, None]
    offset_y = offset_y[:, None]
    scale_x = scale_x[:, None]
    scale_y = scale_y[:, None]

    x = keypoints[..., 0]
    y = keypoints[..., 1]

    x_boundary_inds = x == rois[:, 2][:, None]
    y_boundary_inds = y == rois[:, 3][:, None]

    x = (x - offset_x) * scale_x
    x = x.floor().long()
    y = (y - offset_y) * scale_y
    y = y.floor().long()

    x[x_boundary_inds] = heatmap_size - 1
    y[y_boundary_inds] = heatmap_size - 1

    valid_loc = (x >= 0) & (y >= 0) & (x < heatmap_size) & (y < heatmap_size)
    vis = keypoints[..., 2] > 0
    valid = (valid_loc & vis).long()

    lin_ind = y * heatmap_size + x
    heatmaps = lin_ind * valid

    return heatmaps, valid


def _onnx_heatmaps_to_keypoints(
        maps, maps_i, roi_map_width, roi_map_height, widths_i, heights_i, offset_x_i, offset_y_i
):
    num_keypoints = torch.scalar_tensor(maps.size(1), dtype=torch.int64)

    width_correction = widths_i / roi_map_width
    height_correction = heights_i / roi_map_height

    roi_map = F.interpolate(
        maps_i[:, None], size=(int(roi_map_height), int(roi_map_width)), mode="bicubic", align_corners=False
    )[:, 0]

    w = torch.scalar_tensor(roi_map.size(2), dtype=torch.int64)
    pos = roi_map.reshape(num_keypoints, -1).argmax(dim=1)

    x_int = pos % w
    y_int = (pos - x_int) // w

    x = (torch.tensor(0.5, dtype=torch.float32) + x_int.to(dtype=torch.float32)) * width_correction.to(
        dtype=torch.float32
    )
    y = (torch.tensor(0.5, dtype=torch.float32) + y_int.to(dtype=torch.float32)) * height_correction.to(
        dtype=torch.float32
    )

    xy_preds_i_0 = x + offset_x_i.to(dtype=torch.float32)
    xy_preds_i_1 = y + offset_y_i.to(dtype=torch.float32)
    xy_preds_i_2 = torch.ones(xy_preds_i_1.shape, dtype=torch.float32)
    xy_preds_i = torch.stack(
        [
            xy_preds_i_0.to(dtype=torch.float32),
            xy_preds_i_1.to(dtype=torch.float32),
            xy_preds_i_2.to(dtype=torch.float32),
        ],
        0,
    )

    # TODO: simplify when indexing without rank will be supported by ONNX
    base = num_keypoints * num_keypoints + num_keypoints + 1
    ind = torch.arange(num_keypoints)
    ind = ind.to(dtype=torch.int64) * base
    end_scores_i = (
        roi_map.index_select(1, y_int.to(dtype=torch.int64))
        .index_select(2, x_int.to(dtype=torch.int64))
        .view(-1)
        .index_select(0, ind.to(dtype=torch.int64))
    )

    return xy_preds_i, end_scores_i


@torch.jit._script_if_tracing
def _onnx_heatmaps_to_keypoints_loop(
        maps, rois, widths_ceil, heights_ceil, widths, heights, offset_x, offset_y, num_keypoints
):
    xy_preds = torch.zeros((0, 3, int(num_keypoints)), dtype=torch.float32, device=maps.device)
    end_scores = torch.zeros((0, int(num_keypoints)), dtype=torch.float32, device=maps.device)

    for i in range(int(rois.size(0))):
        xy_preds_i, end_scores_i = _onnx_heatmaps_to_keypoints(
            maps, maps[i], widths_ceil[i], heights_ceil[i], widths[i], heights[i], offset_x[i], offset_y[i]
        )
        xy_preds = torch.cat((xy_preds.to(dtype=torch.float32), xy_preds_i.unsqueeze(0).to(dtype=torch.float32)), 0)
        end_scores = torch.cat(
            (end_scores.to(dtype=torch.float32), end_scores_i.to(dtype=torch.float32).unsqueeze(0)), 0
        )
    return xy_preds, end_scores


def heatmaps_to_keypoints(maps, rois):
    """Extract predicted keypoint locations from heatmaps. Output has shape
    (#rois, 4, #keypoints) with the 4 rows corresponding to (x, y, logit, prob)
    for each keypoint.
    """
    # This function converts a discrete image coordinate in a HEATMAP_SIZE x
    # HEATMAP_SIZE image to a continuous keypoint coordinate. We maintain
    # consistency with keypoints_to_heatmap_labels by using the conversion from
    # Heckbert 1990: c = d + 0.5, where d is a discrete coordinate and c is a
    # continuous coordinate.
    offset_x = rois[:, 0]
    offset_y = rois[:, 1]

    widths = rois[:, 2] - rois[:, 0]
    heights = rois[:, 3] - rois[:, 1]
    widths = widths.clamp(min=1)
    heights = heights.clamp(min=1)
    widths_ceil = widths.ceil()
    heights_ceil = heights.ceil()

    num_keypoints = maps.shape[1]

    if torchvision._is_tracing():
        xy_preds, end_scores = _onnx_heatmaps_to_keypoints_loop(
            maps,
            rois,
            widths_ceil,
            heights_ceil,
            widths,
            heights,
            offset_x,
            offset_y,
            torch.scalar_tensor(num_keypoints, dtype=torch.int64),
        )
        return xy_preds.permute(0, 2, 1), end_scores

    xy_preds = torch.zeros((len(rois), 3, num_keypoints), dtype=torch.float32, device=maps.device)
    end_scores = torch.zeros((len(rois), num_keypoints), dtype=torch.float32, device=maps.device)
    for i in range(len(rois)):
        roi_map_width = int(widths_ceil[i].item())
        roi_map_height = int(heights_ceil[i].item())
        width_correction = widths[i] / roi_map_width
        height_correction = heights[i] / roi_map_height
        roi_map = F.interpolate(
            maps[i][:, None], size=(roi_map_height, roi_map_width), mode="bicubic", align_corners=False
        )[:, 0]
        # roi_map_probs = scores_to_probs(roi_map.copy())
        w = roi_map.shape[2]
        pos = roi_map.reshape(num_keypoints, -1).argmax(dim=1)

        x_int = pos % w
        y_int = torch.div(pos - x_int, w, rounding_mode="floor")
        # assert (roi_map_probs[k, y_int, x_int] ==
        #         roi_map_probs[k, :, :].max())
        x = (x_int.float() + 0.5) * width_correction
        y = (y_int.float() + 0.5) * height_correction
        xy_preds[i, 0, :] = x + offset_x[i]
        xy_preds[i, 1, :] = y + offset_y[i]
        xy_preds[i, 2, :] = 1
        end_scores[i, :] = roi_map[torch.arange(num_keypoints, device=roi_map.device), y_int, x_int]

    return xy_preds.permute(0, 2, 1), end_scores


def keypointrcnn_loss(keypoint_logits, proposals, gt_keypoints, keypoint_matched_idxs):
    # type: (Tensor, List[Tensor], List[Tensor], List[Tensor]) -> Tensor
    N, K, H, W = keypoint_logits.shape
    if H != W:
        raise ValueError(
            f"keypoint_logits height and width (last two elements of shape) should be equal. Instead got H = {H} and W = {W}"
        )
    discretization_size = H
    heatmaps = []
    valid = []
    for proposals_per_image, gt_kp_in_image, midx in zip(proposals, gt_keypoints, keypoint_matched_idxs):
        kp = gt_kp_in_image[midx]
        heatmaps_per_image, valid_per_image = keypoints_to_heatmap(kp, proposals_per_image, discretization_size)

        heatmaps.append(heatmaps_per_image.view(-1))
        valid.append(valid_per_image.view(-1))

    keypoint_targets = torch.cat(heatmaps, dim=0)
    valid = torch.cat(valid, dim=0).to(dtype=torch.uint8)
    valid = torch.where(valid)[0]

    # torch.mean (in binary_cross_entropy_with_logits) doesn't
    # accept empty tensors, so handle it sepaartely
    if keypoint_targets.numel() == 0 or len(valid) == 0:
        return keypoint_logits.sum() * 0

    keypoint_logits = keypoint_logits.view(N * K, H * W)

    keypoint_loss = F.cross_entropy(keypoint_logits[valid], keypoint_targets[valid])
    return keypoint_loss


def keypointrcnn_inference(x, boxes):
    # type: (Tensor, List[Tensor]) -> Tuple[List[Tensor], List[Tensor]]
    kp_probs = []
    kp_scores = []

    boxes_per_image = [box.size(0) for box in boxes]
    x2 = x.split(boxes_per_image, dim=0)

    for xx, bb in zip(x2, boxes):
        kp_prob, scores = heatmaps_to_keypoints(xx, bb)
        kp_probs.append(kp_prob)
        kp_scores.append(scores)

    return kp_probs, kp_scores


def _onnx_expand_boxes(boxes, scale):
    # type: (Tensor, float) -> Tensor
    w_half = (boxes[:, 2] - boxes[:, 0]) * 0.5
    h_half = (boxes[:, 3] - boxes[:, 1]) * 0.5
    x_c = (boxes[:, 2] + boxes[:, 0]) * 0.5
    y_c = (boxes[:, 3] + boxes[:, 1]) * 0.5

    w_half = w_half.to(dtype=torch.float32) * scale
    h_half = h_half.to(dtype=torch.float32) * scale

    boxes_exp0 = x_c - w_half
    boxes_exp1 = y_c - h_half
    boxes_exp2 = x_c + w_half
    boxes_exp3 = y_c + h_half
    boxes_exp = torch.stack((boxes_exp0, boxes_exp1, boxes_exp2, boxes_exp3), 1)
    return boxes_exp


# the next two functions should be merged inside Masker
# but are kept here for the moment while we need them
# temporarily for paste_mask_in_image
def expand_boxes(boxes, scale):
    # type: (Tensor, float) -> Tensor
    if torchvision._is_tracing():
        return _onnx_expand_boxes(boxes, scale)
    w_half = (boxes[:, 2] - boxes[:, 0]) * 0.5
    h_half = (boxes[:, 3] - boxes[:, 1]) * 0.5
    x_c = (boxes[:, 2] + boxes[:, 0]) * 0.5
    y_c = (boxes[:, 3] + boxes[:, 1]) * 0.5

    w_half *= scale
    h_half *= scale

    boxes_exp = torch.zeros_like(boxes)
    boxes_exp[:, 0] = x_c - w_half
    boxes_exp[:, 2] = x_c + w_half
    boxes_exp[:, 1] = y_c - h_half
    boxes_exp[:, 3] = y_c + h_half
    return boxes_exp


@torch.jit.unused
def expand_masks_tracing_scale(M, padding):
    # type: (int, int) -> float
    return torch.tensor(M + 2 * padding).to(torch.float32) / torch.tensor(M).to(torch.float32)


def expand_masks(mask, padding):
    # type: (Tensor, int) -> Tuple[Tensor, float]
    M = mask.shape[-1]
    if torch._C._get_tracing_state():  # could not import is_tracing(), not sure why
        scale = expand_masks_tracing_scale(M, padding)
    else:
        scale = float(M + 2 * padding) / M
    padded_mask = F.pad(mask, (padding,) * 4)
    return padded_mask, scale


def paste_mask_in_image(mask, box, im_h, im_w):
    # type: (Tensor, Tensor, int, int) -> Tensor
    TO_REMOVE = 1
    w = int(box[2] - box[0] + TO_REMOVE)
    h = int(box[3] - box[1] + TO_REMOVE)
    w = max(w, 1)
    h = max(h, 1)

    # Set shape to [batchxCxHxW]
    mask = mask.expand((1, 1, -1, -1))

    # Resize ins
    mask = F.interpolate(mask, size=(h, w), mode="bilinear", align_corners=False)
    mask = mask[0][0]

    im_mask = torch.zeros((im_h, im_w), dtype=mask.dtype, device=mask.device)
    x_0 = max(box[0], 0)
    x_1 = min(box[2] + 1, im_w)
    y_0 = max(box[1], 0)
    y_1 = min(box[3] + 1, im_h)

    im_mask[y_0:y_1, x_0:x_1] = mask[(y_0 - box[1]): (y_1 - box[1]), (x_0 - box[0]): (x_1 - box[0])]
    return im_mask


def _onnx_paste_mask_in_image(mask, box, im_h, im_w):
    one = torch.ones(1, dtype=torch.int64)
    zero = torch.zeros(1, dtype=torch.int64)

    w = box[2] - box[0] + one
    h = box[3] - box[1] + one
    w = torch.max(torch.cat((w, one)))
    h = torch.max(torch.cat((h, one)))

    # Set shape to [batchxCxHxW]
    mask = mask.expand((1, 1, mask.size(0), mask.size(1)))

    # Resize ins
    mask = F.interpolate(mask, size=(int(h), int(w)), mode="bilinear", align_corners=False)
    mask = mask[0][0]

    x_0 = torch.max(torch.cat((box[0].unsqueeze(0), zero)))
    x_1 = torch.min(torch.cat((box[2].unsqueeze(0) + one, im_w.unsqueeze(0))))
    y_0 = torch.max(torch.cat((box[1].unsqueeze(0), zero)))
    y_1 = torch.min(torch.cat((box[3].unsqueeze(0) + one, im_h.unsqueeze(0))))

    unpaded_im_mask = mask[(y_0 - box[1]): (y_1 - box[1]), (x_0 - box[0]): (x_1 - box[0])]

    # TODO : replace below with a dynamic padding when support is added in ONNX

    # pad y
    zeros_y0 = torch.zeros(y_0, unpaded_im_mask.size(1))
    zeros_y1 = torch.zeros(im_h - y_1, unpaded_im_mask.size(1))
    concat_0 = torch.cat((zeros_y0, unpaded_im_mask.to(dtype=torch.float32), zeros_y1), 0)[0:im_h, :]
    # pad x
    zeros_x0 = torch.zeros(concat_0.size(0), x_0)
    zeros_x1 = torch.zeros(concat_0.size(0), im_w - x_1)
    im_mask = torch.cat((zeros_x0, concat_0, zeros_x1), 1)[:, :im_w]
    return im_mask


@torch.jit._script_if_tracing
def _onnx_paste_masks_in_image_loop(masks, boxes, im_h, im_w):
    res_append = torch.zeros(0, im_h, im_w)
    for i in range(masks.size(0)):
        mask_res = _onnx_paste_mask_in_image(masks[i][0], boxes[i], im_h, im_w)
        mask_res = mask_res.unsqueeze(0)
        res_append = torch.cat((res_append, mask_res))
    return res_append


def paste_masks_in_image(masks, boxes, img_shape, padding=1):
    # type: (Tensor, Tensor, Tuple[int, int], int) -> Tensor
    masks, scale = expand_masks(masks, padding=padding)
    boxes = expand_boxes(boxes, scale).to(dtype=torch.int64)
    im_h, im_w = img_shape

    if torchvision._is_tracing():
        return _onnx_paste_masks_in_image_loop(
            masks, boxes, torch.scalar_tensor(im_h, dtype=torch.int64), torch.scalar_tensor(im_w, dtype=torch.int64)
        )[:, None]
    res = [paste_mask_in_image(m[0], b, im_h, im_w) for m, b in zip(masks, boxes)]
    if len(res) > 0:
        ret = torch.stack(res, dim=0)[:, None]
    else:
        ret = masks.new_empty((0, 1, im_h, im_w))
    return ret


class RoIHeads(nn.Module):
    __annotations__ = {
        "box_coder": det_utils.BoxCoder,
        "proposal_matcher": det_utils.Matcher,
        "fg_bg_sampler": det_utils.BalancedPositiveNegativeSampler,
    }

    def __init__(
            self,
            box_roi_pool,
            box_head,
            box_predictor,
            # Faster R-CNN training
            fg_iou_thresh,
            bg_iou_thresh,
            batch_size_per_image,
            positive_fraction,
            bbox_reg_weights,
            # Faster R-CNN inference
            score_thresh,
            nms_thresh,
            detections_per_img,
            # Line
            line_roi_pool=None,
            line_head=None,
            line_predictor=None,

            # point parameters
            point_roi_pool=None,
            point_head=None,
            point_predictor=None,

            ins_head=None,
            ins_predictor=None,
            ins_roi_pool=None,

            # arc parameters
            arc_roi_pool=None,
            arc_head=None,
            arc_predictor=None,

            # Mask
            mask_roi_pool=None,
            mask_head=None,
            mask_predictor=None,
            keypoint_roi_pool=None,
            keypoint_head=None,
            keypoint_predictor=None,

            detect_point=True,
            detect_line=False,
            detect_arc=False,
            detect_circle=False,
    ):
        super().__init__()

        self.box_similarity = box_ops.box_iou
        # assign ground-truth boxes for each proposal
        self.proposal_matcher = det_utils.Matcher(fg_iou_thresh, bg_iou_thresh, allow_low_quality_matches=False)

        self.fg_bg_sampler = det_utils.BalancedPositiveNegativeSampler(batch_size_per_image, positive_fraction)

        if bbox_reg_weights is None:
            bbox_reg_weights = (10.0, 10.0, 5.0, 5.0)
        self.box_coder = det_utils.BoxCoder(bbox_reg_weights)

        self.box_roi_pool = box_roi_pool
        self.box_head = box_head
        self.box_predictor = box_predictor

        self.score_thresh = score_thresh
        self.nms_thresh = nms_thresh
        self.detections_per_img = detections_per_img

        self.line_roi_pool = line_roi_pool
        self.line_head = line_head
        self.line_predictor = line_predictor

        self.point_roi_pool = point_roi_pool
        self.point_head = point_head
        self.point_predictor = point_predictor

        self.arc_roi_pool = arc_roi_pool
        self.arc_head = arc_head
        self.arc_predictor = arc_predictor

        self.ins_roi_pool = ins_roi_pool
        self.ins_head = ins_head
        self.ins_predictor = ins_predictor


        self.mask_roi_pool = mask_roi_pool
        self.mask_head = mask_head
        self.mask_predictor = mask_predictor

        self.keypoint_roi_pool = keypoint_roi_pool
        self.keypoint_head = keypoint_head
        self.keypoint_predictor = keypoint_predictor

        self.detect_point =detect_point
        self.detect_line =detect_line
        self.detect_arc =detect_arc
        self.detect_circle=detect_circle

        self.channel_compress = nn.Sequential(
            nn.Conv2d(256, 8, kernel_size=1),
            nn.BatchNorm2d(8),
            nn.ReLU(inplace=True)
        )

    def has_mask(self):
        if self.mask_roi_pool is None:
            return False
        if self.mask_head is None:
            return False
        if self.mask_predictor is None:
            return False
        return True

    def has_keypoint(self):
        if self.keypoint_roi_pool is None:
            return False
        if self.keypoint_head is None:
            return False
        if self.keypoint_predictor is None:
            return False
        return True

    def has_line(self):
        # if self.line_roi_pool is None:
        #     return False
        if self.line_head is None:
            return False
        # if self.line_predictor is None:
        #     return False
        return True

    def has_point(self):
        # if self.line_roi_pool is None:
        #     return False
        if self.point_head is None:
            return False
        # if self.line_predictor is None:
        #     return False
        return True

    def has_arc(self):
        # if self.line_roi_pool is None:
        #     return False
        if self.arc_head is None:
            return False
        # if self.line_predictor is None:
        #     return False
        return True

    def has_ins(self):
        # if self.line_roi_pool is None:
        #     return False
        if self.ins_head is None:
            return False
        # if self.line_predictor is None:
        #     return False
        return True

    def assign_targets_to_proposals(self, proposals, gt_boxes, gt_labels):
        # type: (List[Tensor], List[Tensor], List[Tensor]) -> Tuple[List[Tensor], List[Tensor]]
        matched_idxs = []
        labels = []
        for proposals_in_image, gt_boxes_in_image, gt_labels_in_image in zip(proposals, gt_boxes, gt_labels):

            if gt_boxes_in_image.numel() == 0:
                # Background image
                device = proposals_in_image.device
                clamped_matched_idxs_in_image = torch.zeros(
                    (proposals_in_image.shape[0],), dtype=torch.int64, device=device
                )
                labels_in_image = torch.zeros((proposals_in_image.shape[0],), dtype=torch.int64, device=device)
            else:
                #  set to self.box_similarity when https://github.com/pytorch/pytorch/issues/27495 lands
                match_quality_matrix = box_ops.box_iou(gt_boxes_in_image, proposals_in_image)
                matched_idxs_in_image = self.proposal_matcher(match_quality_matrix)

                clamped_matched_idxs_in_image = matched_idxs_in_image.clamp(min=0)

                labels_in_image = gt_labels_in_image[clamped_matched_idxs_in_image]
                labels_in_image = labels_in_image.to(dtype=torch.int64)

                # Label background (below the low threshold)
                bg_inds = matched_idxs_in_image == self.proposal_matcher.BELOW_LOW_THRESHOLD
                labels_in_image[bg_inds] = 0

                # Label ignore proposals (between low and high thresholds)
                ignore_inds = matched_idxs_in_image == self.proposal_matcher.BETWEEN_THRESHOLDS
                labels_in_image[ignore_inds] = -1  # -1 is ignored by sampler

            matched_idxs.append(clamped_matched_idxs_in_image)
            labels.append(labels_in_image)
        return matched_idxs, labels

    def subsample(self, labels):
        # type: (List[Tensor]) -> List[Tensor]
        sampled_pos_inds, sampled_neg_inds = self.fg_bg_sampler(labels)
        sampled_inds = []
        for img_idx, (pos_inds_img, neg_inds_img) in enumerate(zip(sampled_pos_inds, sampled_neg_inds)):
            img_sampled_inds = torch.where(pos_inds_img | neg_inds_img)[0]
            sampled_inds.append(img_sampled_inds)
        return sampled_inds

    def add_gt_proposals(self, proposals, gt_boxes):
        # type: (List[Tensor], List[Tensor]) -> List[Tensor]
        proposals = [torch.cat((proposal, gt_box)) for proposal, gt_box in zip(proposals, gt_boxes)]

        return proposals

    def check_targets(self, targets):
        # type: (Optional[List[Dict[str, Tensor]]]) -> None
        if targets is None:
            raise ValueError("targets should not be None")
        if not all(["boxes" in t for t in targets]):
            raise ValueError("Every element of targets should have a boxes key")
        if not all(["labels" in t for t in targets]):
            raise ValueError("Every element of targets should have a labels key")
        if self.has_mask():
            if not all(["masks" in t for t in targets]):
                raise ValueError("Every element of targets should have a masks key")

    def select_training_samples(
            self,
            proposals,  # type: List[Tensor]
            targets,  # type: Optional[List[Dict[str, Tensor]]]
    ):
        # type: (...) -> Tuple[List[Tensor], List[Tensor], List[Tensor], List[Tensor]]
        self.check_targets(targets)
        if targets is None:
            raise ValueError("targets should not be None")
        dtype = proposals[0].dtype
        device = proposals[0].device

        gt_boxes = [t["boxes"].to(dtype) for t in targets]
        gt_labels = [t["labels"] for t in targets]

        # append ground-truth bboxes to propos
        proposals = self.add_gt_proposals(proposals, gt_boxes)

        # get matching gt indices for each proposal
        matched_idxs, labels = self.assign_targets_to_proposals(proposals, gt_boxes, gt_labels)
        # sample a fixed proportion of positive-negative proposals
        sampled_inds = self.subsample(labels)
        matched_gt_boxes = []
        num_images = len(proposals)
        for img_id in range(num_images):
            img_sampled_inds = sampled_inds[img_id]
            proposals[img_id] = proposals[img_id][img_sampled_inds]
            labels[img_id] = labels[img_id][img_sampled_inds]
            matched_idxs[img_id] = matched_idxs[img_id][img_sampled_inds]

            gt_boxes_in_image = gt_boxes[img_id]
            if gt_boxes_in_image.numel() == 0:
                gt_boxes_in_image = torch.zeros((1, 4), dtype=dtype, device=device)
            matched_gt_boxes.append(gt_boxes_in_image[matched_idxs[img_id]])

        regression_targets = self.box_coder.encode(matched_gt_boxes, proposals)
        return proposals, matched_idxs, labels, regression_targets

    def postprocess_detections(
            self,
            class_logits,  # type: Tensor
            box_regression,  # type: Tensor
            proposals,  # type: List[Tensor]
            image_shapes,  # type: List[Tuple[int, int]]
    ):
        # type: (...) -> Tuple[List[Tensor], List[Tensor], List[Tensor]]
        device = class_logits.device
        num_classes = class_logits.shape[-1]

        boxes_per_image = [boxes_in_image.shape[0] for boxes_in_image in proposals]
        pred_boxes = self.box_coder.decode(box_regression, proposals)

        pred_scores = F.softmax(class_logits, -1)

        pred_boxes_list = pred_boxes.split(boxes_per_image, 0)
        pred_scores_list = pred_scores.split(boxes_per_image, 0)

        all_boxes = []
        all_scores = []
        all_labels = []
        for boxes, scores, image_shape in zip(pred_boxes_list, pred_scores_list, image_shapes):
            boxes = box_ops.clip_boxes_to_image(boxes, image_shape)

            # create labels for each prediction
            labels = torch.arange(num_classes, device=device)
            labels = labels.view(1, -1).expand_as(scores)

            # remove predictions with the background label
            boxes = boxes[:, 1:]
            scores = scores[:, 1:]
            labels = labels[:, 1:]

            # batch everything, by making every class prediction be a separate instance
            boxes = boxes.reshape(-1, 4)
            scores = scores.reshape(-1)
            labels = labels.reshape(-1)

            # remove low scoring boxes
            inds = torch.where(scores > self.score_thresh)[0]
            boxes, scores, labels = boxes[inds], scores[inds], labels[inds]

            # remove empty boxes
            keep = box_ops.remove_small_boxes(boxes, min_size=1e-2)
            boxes, scores, labels = boxes[keep], scores[keep], labels[keep]

            # non-maximum suppression, independently done per class
            keep = box_ops.batched_nms(boxes, scores, labels, self.nms_thresh)
            # keep only topk scoring predictions
            keep = keep[: self.detections_per_img]
            boxes, scores, labels = boxes[keep], scores[keep], labels[keep]

            all_boxes.append(boxes)
            all_scores.append(scores)
            all_labels.append(labels)

        return all_boxes, all_scores, all_labels

    def forward(
            self,
            features,  # type: Dict[str, Tensor]
            proposals,  # type: List[Tensor]
            image_shapes,  # type: List[Tuple[int, int]]
            targets=None,  # type: Optional[List[Dict[str, Tensor]]]
    ):
        # type: (...) -> Tuple[List[Dict[str, Tensor]], Dict[str, Tensor]]
        """
        Args:
            features (List[Tensor])
            proposals (List[Tensor[N, 4]])
            image_shapes (List[Tuple[H, W]])
            targets (List[Dict])
        """

        print(f'roihead forward!!!')
        if targets is not None:
            for t in targets:
                # TODO: https://github.com/pytorch/pytorch/issues/26731
                floating_point_types = (torch.float, torch.double, torch.half)
                if not t["boxes"].dtype in floating_point_types:
                    raise TypeError(f"target boxes must of float type, instead got {t['boxes'].dtype}")
                if not t["labels"].dtype == torch.int64:
                    raise TypeError(f"target labels must of int64 type, instead got {t['labels'].dtype}")
                if self.has_keypoint():
                    if not t["keypoints"].dtype == torch.float32:
                        raise TypeError(f"target keypoints must of float type, instead got {t['keypoints'].dtype}")

        if self.training:
            proposals, matched_idxs, labels, regression_targets = self.select_training_samples(proposals, targets)
        else:
            if targets is not None:
                proposals, matched_idxs, labels, regression_targets = self.select_training_samples(proposals, targets)
            else:
                labels = None
                regression_targets = None
                matched_idxs = None
        device=features['0'].device

        box_features = self.box_roi_pool(features, proposals, image_shapes)
        box_features = self.box_head(box_features)


        class_logits, box_regression = self.box_predictor(box_features)

        result: List[Dict[str, torch.Tensor]] = []
        losses = {}
        # _, C, H, W = features['0'].shape  # å¿½ç¥ batch_sizeï¼å ä¸ºæä»¬åªå³å¿ C, H, W
        if self.training:
            if labels is None:
                raise ValueError("labels cannot be None")
            if regression_targets is None:
                raise ValueError("regression_targets cannot be None")
            print(f'boxes compute losses')
            loss_classifier, loss_box_reg = fastrcnn_loss(class_logits, box_regression, labels, regression_targets)
            losses = {"loss_classifier": loss_classifier, "loss_box_reg": loss_box_reg}
        else:
            if targets is not None:
                loss_classifier, loss_box_reg = fastrcnn_loss(class_logits, box_regression, labels, regression_targets)
                losses = {"loss_classifier": loss_classifier, "loss_box_reg": loss_box_reg}

            boxes, scores, labels = self.postprocess_detections(class_logits, box_regression, proposals,
                                                                image_shapes)
            num_images = len(boxes)
            for i in range(num_images):
                result.append(
                    {
                        "boxes": boxes[i],
                        "labels": labels[i],
                        "scores": scores[i],
                    }
                )

        if  self.has_line() and self.detect_line:
            print(f'roi_heads forward has_line()!!!!')
            # print(f'labels:{labels}')
            line_proposals = [p["boxes"] for p in result]
            point_proposals = [p["boxes"] for p in result]
            print(f'boxes_proposals:{len(line_proposals)}')

            # if line_proposals is None or len(line_proposals) == 0:
            #     # è¿åç©ºç¹å¾æèè·³è¿è¯¥é¨åè®¡ç®
            #     return torch.empty(0, C, H, W).to(features['0'].device)

            if self.training:
                # during training, only focus on positive boxes
                num_images = len(proposals)
                print(f'num_images:{num_images}')
                line_proposals = []
                point_proposals = []
                arc_proposals = []

                pos_matched_idxs = []
                line_pos_matched_idxs = []
                point_pos_matched_idxs = []
                if matched_idxs is None:
                    raise ValueError("if in trainning, matched_idxs should not be None")

                for img_id in range(num_images):
                    pos = torch.where(labels[img_id] > 0)[0]

                    line_pos=torch.where(labels[img_id] ==2)[0]
                    # point_pos=torch.where(labels[img_id] ==1)[0]

                    line_proposals.append(proposals[img_id][line_pos])
                    # point_proposals.append(proposals[img_id][point_pos])

                    line_pos_matched_idxs.append(matched_idxs[img_id][line_pos])
                    # point_pos_matched_idxs.append(matched_idxs[img_id][point_pos])

                    # pos_matched_idxs.append(matched_idxs[img_id][pos])
            else:
                if targets is not None:

                    pos_matched_idxs = []
                    num_images = len(proposals)
                    line_proposals = []


                    line_pos_matched_idxs = []
                    print(f'val num_images:{num_images}')
                    if matched_idxs is None:
                        raise ValueError("if in trainning, matched_idxs should not be None")

                    for img_id in range(num_images):
                        # pos = torch.where(labels[img_id] > 0)[0]

                        line_pos = torch.where(labels[img_id] == 2)[0]

                        line_proposals.append(proposals[img_id][line_pos])

                        line_pos_matched_idxs.append(matched_idxs[img_id][line_pos])

                else:
                    pos_matched_idxs = None

            line_proposals_valid=self.check_proposals(line_proposals)
            if line_proposals_valid:

                feature_logits = self.line_forward3(features, image_shapes, line_proposals)

                loss_line = None
                loss_line_iou =None

                if self.training:

                    if targets is None or pos_matched_idxs is None:
                        raise ValueError("both targets and pos_matched_idxs should not be None when in training mode")

                    gt_lines = [t["lines"] for t in targets if "lines" in t]


                    # print(f'gt_lines:{gt_lines[0].shape}')
                    h, w = targets[0]["img_size"]
                    img_size = h

                    gt_lines_tensor=torch.zeros(0,0)
                    if len(gt_lines)>0:
                        gt_lines_tensor = torch.cat(gt_lines)
                        print(f'gt_lines_tensor:{gt_lines_tensor.shape}')


                    if gt_lines_tensor.shape[0]>0 :
                        print(f'start to lines_point_pair_loss')
                        loss_line = lines_point_pair_loss(
                            feature_logits, line_proposals, gt_lines, line_pos_matched_idxs
                        )
                        loss_line_iou = line_iou_loss(feature_logits, line_proposals, gt_lines, line_pos_matched_idxs, img_size)


                    if  loss_line is None:
                        print(f'loss_line is None111')
                        loss_line = torch.tensor(0.0, device=device)

                    if loss_line_iou is None:
                        print(f'loss_line_iou is None111')
                        loss_line_iou = torch.tensor(0.0, device=device)

                    loss_line = {"loss_line": loss_line}
                    loss_line_iou = {'loss_line_iou': loss_line_iou}

                else:
                    if targets is not None:
                        h, w = targets[0]["img_size"]
                        img_size = h
                        gt_lines = [t["lines"] for t in targets if "lines" in t]

                        gt_lines_tensor = torch.zeros(0, 0)
                        if len(gt_lines)>0:
                            gt_lines_tensor = torch.cat(gt_lines)


                        if gt_lines_tensor.shape[0] > 0 and feature_logits is not None:
                            loss_line = lines_point_pair_loss(
                                feature_logits, line_proposals, gt_lines, line_pos_matched_idxs
                            )
                            print(f'compute_line_loss:{loss_line}')
                            loss_line_iou = line_iou_loss(feature_logits , line_proposals, gt_lines, line_pos_matched_idxs,
                                                          img_size)


                        if  loss_line is None:
                            print(f'loss_line is None')
                            loss_line=torch.tensor(0.0,device=device)

                        if  loss_line_iou is None:
                            print(f'loss_line_iou is None')
                            loss_line_iou=torch.tensor(0.0,device=device)


                        loss_line = {"loss_line": loss_line}
                        loss_line_iou = {'loss_line_iou': loss_line_iou}


                    else:
                        loss_line = {}
                        loss_line_iou = {}
                        if feature_logits is None or line_proposals is None:
                            raise ValueError(
                                "both keypoint_logits and keypoint_proposals should not be None when not in training mode"
                            )

                        if feature_logits is not None:
                            lines_probs, lines_scores = line_inference(feature_logits,line_proposals)
                            for keypoint_prob, kps, r in zip(lines_probs, lines_scores, result):
                                r["lines"] = keypoint_prob
                                r["lines_scores"] = kps


                print(f'loss_line11111:{loss_line}')
                losses.update(loss_line)
                losses.update(loss_line_iou)
                print(f'losses:{losses}')
        if self.has_point() and self.detect_point:
            print(f'roi_heads forward has_point()!!!!')
            # print(f'labels:{labels}')
            point_proposals = [p["boxes"] for p in result]
            print(f'boxes_proposals:{len(point_proposals)}')

            # if line_proposals is None or len(line_proposals) == 0:
            #     # è¿åç©ºç¹å¾æèè·³è¿è¯¥é¨åè®¡ç®
            #     return torch.empty(0, C, H, W).to(features['0'].device)

            if self.training:
                # during training, only focus on positive boxes
                num_images = len(proposals)
                print(f'num_images:{num_images}')
                point_proposals = []
                point_pos_matched_idxs = []
                if matched_idxs is None:
                    raise ValueError("if in trainning, matched_idxs should not be None")
                for img_id in range(num_images):
                    point_pos=torch.where(labels[img_id] ==1)[0]
                    point_proposals.append(proposals[img_id][point_pos])
                    point_pos_matched_idxs.append(matched_idxs[img_id][point_pos])
            else:
                if targets is not None:

                    num_images = len(proposals)
                    point_proposals = []

                    point_pos_matched_idxs = []
                    print(f'val num_images:{num_images}')
                    if matched_idxs is None:
                        raise ValueError("if in trainning, matched_idxs should not be None")

                    for img_id in range(num_images):
                        point_pos = torch.where(labels[img_id] == 1)[0]
                        point_proposals.append(proposals[img_id][point_pos])
                        point_pos_matched_idxs.append(matched_idxs[img_id][point_pos])

                else:
                    pos_matched_idxs = None

            point_proposals_valid = self.check_proposals(point_proposals)

            if point_proposals_valid:

                feature_logits = self.point_forward1(features, image_shapes, point_proposals)

                loss_point=None

                if self.training:

                    if targets is None or point_pos_matched_idxs is None:
                        raise ValueError("both targets and pos_matched_idxs should not be None when in training mode")

                    gt_points = [t["points"] for t in targets if "points" in t]

                    print(f'gt_points:{gt_points[0].shape}')
                    h, w = targets[0]["img_size"]
                    img_size = h

                    gt_points_tensor = torch.zeros(0, 0)
                    if len(gt_points) > 0:
                        gt_points_tensor = torch.cat(gt_points)
                        print(f'gt_points_tensor:{gt_points_tensor.shape}')

                    if gt_points_tensor.shape[0] > 0:
                        print(f'start to compute point_loss')

                        loss_point=compute_point_loss(feature_logits,point_proposals,gt_points,point_pos_matched_idxs)

                    if loss_point is None:
                        print(f'loss_point is None111')
                        loss_point = torch.tensor(0.0, device=device)

                    loss_point = {"loss_point": loss_point}

                else:
                    if targets is not None:
                        h, w = targets[0]["img_size"]
                        img_size = h
                        gt_points = [t["points"] for t in targets if "points" in t]

                        gt_points_tensor = torch.zeros(0, 0)
                        if len(gt_points) > 0:
                            gt_points_tensor = torch.cat(gt_points)
                            print(f'gt_points_tensor:{gt_points_tensor.shape}')

                        if gt_points_tensor.shape[0] > 0:
                            print(f'start to compute point_loss')

                            loss_point = compute_point_loss(feature_logits, point_proposals, gt_points,
                                                            point_pos_matched_idxs)

                        if loss_point is None:
                            print(f'loss_point is None111')
                            loss_point = torch.tensor(0.0, device=device)

                        loss_point = {"loss_point": loss_point}


                    else:
                        loss_point = {}
                        if feature_logits is None or point_proposals is None:
                            raise ValueError(
                                "both keypoint_logits and keypoint_proposals should not be None when not in training mode"
                            )

                        if feature_logits is not None:

                            points_probs, points_scores = point_inference(feature_logits,point_proposals)
                            for keypoint_prob, kps, r in zip(points_probs, points_scores, result):
                                r["points"] = keypoint_prob
                                r["points_scores"] = kps

                print(f'loss_point:{loss_point}')
                losses.update(loss_point)
                print(f'losses:{losses}')


        if self.has_arc() and self.detect_arc:
            print(f'roi_heads forward has_arc()!!!!')
            # print(f'labels:{labels}')
            arc_proposals = [p["boxes"] for p in result]
            print(f'boxes_proposals:{len(arc_proposals)}')
            print(f'boxes_proposals:{len(arc_proposals)}')

            # if line_proposals is None or len(line_proposals) == 0:
            #     # è¿åç©ºç¹å¾æèè·³è¿è¯¥é¨åè®¡ç®
            #     return torch.empty(0, C, H, W).to(features['0'].device)

            if self.training:
                # during training, only focus on positive boxes
                num_images = len(proposals)
                print(f'num_images:{num_images}')
                arc_proposals = []
                arc_pos_matched_idxs = []
                if matched_idxs is None:
                    raise ValueError("if in trainning, matched_idxs should not be None")
                for img_id in range(num_images):
                    arc_pos=torch.where(labels[img_id] ==3)[0]
                    arc_proposals.append(proposals[img_id][arc_pos])
                    arc_pos_matched_idxs.append(matched_idxs[img_id][arc_pos])
            else:
                if targets is not None:

                    num_images = len(proposals)
                    arc_proposals = []

                    arc_pos_matched_idxs = []
                    print(f'val num_images:{num_images}')
                    if matched_idxs is None:
                        raise ValueError("if in trainning, matched_idxs should not be None")

                    for img_id in range(num_images):
                        arc_pos = torch.where(labels[img_id] == 3)[0]
                        arc_proposals.append(proposals[img_id][arc_pos])
                        arc_pos_matched_idxs.append(matched_idxs[img_id][arc_pos])

                else:
                    arc_pos_matched_idxs = None

            arc_proposals_valid=self.check_proposals(arc_proposals)

            if arc_proposals_valid:


                feature_logits = self.arc_forward1(features, image_shapes, arc_proposals)

                loss_arc=None

                if self.training:

                    if targets is None or arc_pos_matched_idxs is None:
                        raise ValueError("both targets and pos_matched_idxs should not be None when in training mode")

                    gt_arcs = [t["arc_mask"] for t in targets if "arc_mask" in t]

                    print(f'gt_arcs:{gt_arcs[0].shape}')
                    h, w = targets[0]["img_size"]
                    img_size = h

                    # gt_arcs_tensor = torch.zeros(0, 0)
                    # if len(gt_arcs) > 0:
                    #     gt_arcs_tensor = torch.cat(gt_arcs)
                    #     print(f'gt_arcs_tensor:{gt_arcs_tensor.shape}')
                    #
                    # if gt_arcs_tensor.shape[0] > 0:
                    #     print(f'start to compute point_loss')
                    if len(gt_arcs) > 0 and feature_logits is not None:
                        loss_arc = compute_mask_loss(feature_logits, arc_proposals, gt_arcs, arc_pos_matched_idxs)

                    if loss_arc is None:
                        print(f'loss_arc is None111')
                        loss_arc = torch.tensor(0.0, device=device)

                    loss_arc = {"loss_arc": loss_arc}

                else:
                    if targets is not None:
                        h, w = targets[0]["img_size"]
                        img_size = h
                        gt_arcs = [t["arc_mask"] for t in targets if "arc_mask" in t]

                        print(f'gt_arcs:{gt_arcs[0].shape}')
                        h, w = targets[0]["img_size"]
                        img_size = h

                        # gt_arcs_tensor = torch.zeros(0, 0)
                        # if len(gt_arcs) > 0:
                        #     gt_arcs_tensor = torch.cat(gt_arcs)
                        #     print(f'gt_arcs_tensor:{gt_arcs_tensor.shape}')

                        # if gt_arcs_tensor.shape[0] > 0 and feature_logits is not None:
                        #     print(f'start to compute arc_loss')

                        if len(gt_arcs) > 0 and feature_logits is not None:
                            print(f'start to compute arc_loss')
                            loss_arc = compute_mask_loss(feature_logits, arc_proposals, gt_arcs, arc_pos_matched_idxs)


                        if loss_arc is None:
                            print(f'loss_arc is None111')
                            loss_arc = torch.tensor(0.0, device=device)

                        loss_arc = {"loss_arc": loss_arc}


                    else:
                        loss_arc = {}
                        if feature_logits is None or arc_proposals is None:
                            # raise ValueError(
                            #     "both arc_feature_logits and arc_proposals should not be None when not in training mode"
                            # )

                            print(f'error :both arc_feature_logits and arc_proposals should not be None when not in training mode"')
                            pass

                        if feature_logits is not None and arc_proposals is not None:

                            arcs_probs, arcs_scores, arcs_point = arc_inference(feature_logits,arc_proposals, th=0)
                            for keypoint_prob, kps, kp, r in zip(arcs_probs, arcs_scores, arcs_point, result):
                                # r["arcs"] = keypoint_prob
                                r["arcs"] = feature_logits
                                r["arcs_scores"] = kps
                                r["arcs_point"] = feature_logits


                # print(f'loss_point:{loss_point}')
                losses.update(loss_arc)
                print(f'losses:{losses}')

        if self.has_ins and self.detect_circle:
            print(f'roi_heads forward has_circle()!!!!')
            # print(f'labels:{labels}')
            circle_proposals = [p["boxes"] for p in result]
            print(f'boxes_proposals:{len(circle_proposals)}')

            # if line_proposals is None or len(line_proposals) == 0:
            #     # è¿åç©ºç¹å¾æèè·³è¿è¯¥é¨åè®¡ç®
            #     return torch.empty(0, C, H, W).to(features['0'].device)

            if self.training:
                # during training, only focus on positive boxes
                num_images = len(proposals)
                print(f'num_images:{num_images}')
                circle_proposals = []
                circle_pos_matched_idxs = []
                if matched_idxs is None:
                    raise ValueError("if in trainning, matched_idxs should not be None")
                for img_id in range(num_images):
                    circle_pos = torch.where(labels[img_id] == 4)[0]
                    circle_proposals.append(proposals[img_id][circle_pos])
                    circle_pos_matched_idxs.append(matched_idxs[img_id][circle_pos])
            else:
                if targets is not None:

                    num_images = len(proposals)
                    circle_proposals = []

                    circle_pos_matched_idxs = []
                    print(f'val num_images:{num_images}')
                    if matched_idxs is None:
                        raise ValueError("if in trainning, matched_idxs should not be None")

                    for img_id in range(num_images):
                        circle_pos = torch.where(labels[img_id] == 4)[0]
                        circle_proposals.append(proposals[img_id][circle_pos])
                        circle_pos_matched_idxs.append(matched_idxs[img_id][circle_pos])

                else:
                    pos_matched_idxs = None

            # circle_proposals_tensor=torch.cat(circle_proposals)

            circle_proposals_valid = self.check_proposals(circle_proposals)

            if  circle_proposals_valid:


                print(f'features from backbone:{features['0'].shape}')
                feature_logits = self.ins_forward1(features, image_shapes, circle_proposals)

                loss_circle = None
                loss_circle_extra=None

                if self.training:

                    if targets is None or circle_pos_matched_idxs is None:
                        raise ValueError("both targets and pos_matched_idxs should not be None when in training mode")

                    gt_circles = [t["circle_masks"] for t in targets if "circle_masks" in t]
                    gt_labels = [t["labels"] for t in targets]

                    print(f'gt_circle:{gt_circles[0].shape}')
                    h, w = targets[0]["img_size"]
                    img_size = h

                    gt_circles_tensor = torch.zeros(0, 0)
                    if len(gt_circles) > 0:
                        gt_circles_tensor = torch.cat(gt_circles)
                        print(f'gt_circles_tensor:{gt_circles_tensor.shape}')

                    if gt_circles_tensor.shape[0] > 0:
                        print(f'start to compute circle_loss')

                        loss_circle = compute_mask_loss(feature_logits, circle_proposals, gt_circles, circle_pos_matched_idxs)

                        # loss_circle_extra=compute_circle_extra_losses(feature_logits, circle_proposals, gt_circles, circle_pos_matched_idxs)

                    if loss_circle is None:
                        print(f'loss_circle is None111')
                        loss_circle = torch.tensor(0.0, device=device)

                    if loss_circle_extra is None:
                        print(f'loss_circle_extra is None111')
                        loss_circle_extra = torch.tensor(0.0, device=device)

                    loss_circle = {"loss_circle": loss_circle}
                    loss_circle_extra = {"loss_circle_extra": loss_circle_extra}

                else:
                    if targets is not None:
                        h, w = targets[0]["img_size"]
                        img_size = h
                        gt_circles = [t["circle_masks"] for t in targets if "circle_masks" in t]
                        gt_labels = [t["labels"] for t in targets]
                        gt_circles_tensor = torch.zeros(0, 0)
                        if len(gt_circles) > 0:
                            gt_circles_tensor = torch.cat(gt_circles)
                            print(f'gt_circles_tensor:{gt_circles_tensor.shape}')

                        if gt_circles_tensor.shape[0] > 0:
                            print(f'start to compute circle_loss')

                            loss_circle = compute_mask_loss(feature_logits, circle_proposals, gt_circles,
                                                            circle_pos_matched_idxs)

                            # loss_circle_extra = compute_circle_extra_losses(feature_logits, circle_proposals, gt_circles,circle_pos_matched_idxs)

                        if loss_circle is None:
                            print(f'loss_circle is None111')
                            loss_circle = torch.tensor(0.0, device=device)

                        if loss_circle_extra is None:
                            print(f'loss_circle_extra is None111')
                            loss_circle_extra = torch.tensor(0.0, device=device)

                        loss_circle = {"loss_circle": loss_circle}
                        loss_circle_extra = {"loss_circle_extra": loss_circle_extra}


                    else:
                        loss_circle = {}
                        loss_circle_extra = {}
                        if feature_logits is None or circle_proposals is None:
                            raise ValueError(
                                "both keypoint_logits and keypoint_proposals should not be None when not in training mode"
                            )

                        if feature_logits is not None:

                            circles_probs, circles_scores, circle_points = arc_inference(feature_logits,
                                                                                         circle_proposals, th=0)
                            # print(f'circles_probs:{circles_probs.shape}, circles_scores:{circles_scores.shape}')
                            proposals_per_image = [box.size(0) for box in circle_proposals]
                            print(f'circle_proposals_per_image:{proposals_per_image}')
                            feature_logits_props = []
                            start_idx = 0
                            for num_p in proposals_per_image:
                                current_features = feature_logits[start_idx:start_idx + num_p]
                                merged_feature = torch.sum(current_features, dim=0, keepdim=True)
                                feature_logits_props.append(merged_feature)
                                start_idx += num_p

                            for keypoint_prob, kps, r, f in zip(circles_probs, circles_scores, result,
                                                                feature_logits_props):
                                r["circles"] = keypoint_prob
                                r["circles_scores"] = kps
                                print(f'circles feature map:{f.shape}')
                                r["features"] = f.squeeze(0)

                print(f'loss_circle:{loss_circle}')
                print(f'loss_circle_extra:{loss_circle_extra}')
                losses.update(loss_circle)
                losses.update(loss_circle_extra)
                print(f'losses:{losses}')


        if self.has_mask():
            mask_proposals = [p["boxes"] for p in result]
            if self.training:
                if matched_idxs is None:
                    raise ValueError("if in training, matched_idxs should not be None")

                # during training, only focus on positive boxes
                num_images = len(proposals)
                mask_proposals = []
                pos_matched_idxs = []
                for img_id in range(num_images):
                    pos = torch.where(labels[img_id] > 0)[0]
                    mask_proposals.append(proposals[img_id][pos])
                    pos_matched_idxs.append(matched_idxs[img_id][pos])
            else:
                pos_matched_idxs = None

            if self.mask_roi_pool is not None:
                mask_features = self.mask_roi_pool(features, mask_proposals, image_shapes)
                mask_features = self.mask_head(mask_features)
                mask_logits = self.mask_predictor(mask_features)
            else:
                raise Exception("Expected mask_roi_pool to be not None")

            loss_mask = {}
            if self.training:
                if targets is None or pos_matched_idxs is None or mask_logits is None:
                    raise ValueError("targets, pos_matched_idxs, mask_logits cannot be None when training")

                gt_masks = [t["masks"] for t in targets]
                gt_labels = [t["labels"] for t in targets]
                rcnn_loss_mask = maskrcnn_loss(mask_logits, mask_proposals, gt_masks, gt_labels, pos_matched_idxs)
                loss_mask = {"loss_mask": rcnn_loss_mask}
            else:
                labels = [r["labels"] for r in result]
                masks_probs = maskrcnn_inference(mask_logits, labels)
                for mask_prob, r in zip(masks_probs, result):
                    r["masks"] = mask_prob

            losses.update(loss_mask)

        # keep none checks in if conditional so torchscript will conditionally
        # compile each branch
        if self.has_keypoint():
            keypoint_proposals = [p["boxes"] for p in result]
            if self.training:
                # during training, only focus on positive boxes
                num_images = len(proposals)
                keypoint_proposals = []
                pos_matched_idxs = []
                if matched_idxs is None:
                    raise ValueError("if in trainning, matched_idxs should not be None")

                for img_id in range(num_images):
                    pos = torch.where(labels[img_id] > 0)[0]
                    keypoint_proposals.append(proposals[img_id][pos])
                    pos_matched_idxs.append(matched_idxs[img_id][pos])
            else:
                pos_matched_idxs = None

            keypoint_features = self.line_roi_pool(features, keypoint_proposals, image_shapes)

            keypoint_features = self.line_head(keypoint_features)
            keypoint_logits = self.line_predictor(keypoint_features)

            loss_keypoint = {}
            if self.training:
                if targets is None or pos_matched_idxs is None:
                    raise ValueError("both targets and pos_matched_idxs should not be None when in training mode")

                gt_keypoints = [t["keypoints"] for t in targets]
                rcnn_loss_keypoint = keypointrcnn_loss(
                    keypoint_logits, keypoint_proposals, gt_keypoints, pos_matched_idxs
                )
                loss_keypoint = {"loss_keypoint": rcnn_loss_keypoint}
            else:
                if keypoint_logits is None or keypoint_proposals is None:
                    raise ValueError(
                        "both keypoint_logits and keypoint_proposals should not be None when not in training mode"
                    )

                keypoints_probs, lines_scores = keypointrcnn_inference(keypoint_logits, keypoint_proposals)
                for keypoint_prob, kps, r in zip(keypoints_probs, lines_scores, result):
                    r["keypoints"] = keypoint_prob
                    r["keypoints_scores"] = kps
            losses.update(loss_keypoint)

        return result, losses

    def check_proposals(self, proposals):
        valid = True
        for proposal in proposals:
            # print(f'per circle_proposal:{circle_proposal.shape}')
            if proposal.shape[0] == 0:
                valid = False
        return valid

    def line_forward1(self, features, image_shapes, line_proposals):
        print(f'line_proposals:{len(line_proposals)}')
        # cs_features= features['0']
        # print(f'features-0:{features['0'].shape}')
        cs_features = self.channel_compress(features['0'])
        filtered_proposals = [proposal for proposal in line_proposals if proposal.shape[0] > 0]
        if len(filtered_proposals) > 0:
            filtered_proposals_tensor = torch.cat(filtered_proposals)
            print(f'filtered_proposals_tensor:{filtered_proposals_tensor.shape}')
        line_proposals_tensor = torch.cat(line_proposals)
        print(f'line_proposals_tensor:{line_proposals_tensor.shape}')
        roi_features = features_align(cs_features, line_proposals, image_shapes)
        if roi_features is not None:
            print(f'line_features from align:{roi_features.shape}')
        feature_logits = self.line_head(roi_features)
        print(f'feature_logits from line_head:{feature_logits.shape}')
        return feature_logits

    def line_forward2(self, features, image_shapes, line_proposals):
        print(f'line_proposals:{len(line_proposals)}')
        # cs_features= features['0']
        # print(f'features-0:{features['0'].shape}')
        # cs_features = self.channel_compress(features['0'])
        cs_features=features['0']
        filtered_proposals = [proposal for proposal in line_proposals if proposal.shape[0] > 0]

        if len(filtered_proposals) > 0:
            filtered_proposals_tensor = torch.cat(filtered_proposals)
            print(f'filtered_proposals_tensor:{filtered_proposals_tensor.shape}')
            line_proposals=filtered_proposals
        line_proposals_tensor = torch.cat(line_proposals)
        print(f'line_proposals_tensor:{line_proposals_tensor.shape}')

        feature_logits = self.line_head(cs_features)
        print(f'feature_logits from line_head:{feature_logits.shape}')

        roi_features = features_align(feature_logits, line_proposals, image_shapes)
        if roi_features is not None:
            print(f'roi_features from align:{roi_features.shape}')
        return roi_features

    def line_forward3(self, features, image_shapes, line_proposals):
        print(f'line_proposals:{len(line_proposals)}')
        # cs_features= features['0']
        # print(f'features-0:{features['0'].shape}')
        # cs_features = self.channel_compress(features['0'])
        cs_features=features['0']

        # cs_features = features
        # filtered_proposals = [proposal for proposal in line_proposals if proposal.shape[0] > 0]
        #
        # if len(filtered_proposals) > 0:
        #     filtered_proposals_tensor = torch.cat(filtered_proposals)
        #     print(f'filtered_proposals_tensor:{filtered_proposals_tensor.shape}')
        #     line_proposals=filtered_proposals
        # line_proposals_tensor = torch.cat(line_proposals)
        # print(f'line_proposals_tensor:{line_proposals_tensor.shape}')

        feature_logits = self.line_predictor(cs_features)
        print(f'feature_logits from line_head:{feature_logits.shape}')

        roi_features = features_align(feature_logits, line_proposals, image_shapes)
        if roi_features is not None:
            print(f'roi_features from align:{roi_features.shape}')
        return roi_features

    def point_forward1(self, features, image_shapes, proposals):
        print(f'point_proposals:{len(proposals)}')
        # cs_features= features['0']
        # print(f'features-0:{features['0'].shape}')
        # cs_features = self.channel_compress(features['0'])
        cs_features=features['0']
        # filtered_proposals = [proposal for proposal in proposals if proposal.shape[0] > 0]
        #
        # if len(filtered_proposals) > 0:
        #     filtered_proposals_tensor = torch.cat(filtered_proposals)
        #     print(f'filtered_proposals_tensor:{filtered_proposals_tensor.shape}')
        #     proposals=filtered_proposals
        # point_proposals_tensor = torch.cat(proposals)
        # print(f'point_proposals_tensor:{point_proposals_tensor.shape}')

        feature_logits = self.point_predictor(cs_features)
        print(f'feature_logits from line_head:{feature_logits.shape}')

        roi_features = features_align(feature_logits, proposals, image_shapes)
        if roi_features is not None:
            print(f'roi_features from align:{roi_features.shape}')
        return roi_features

    def ins_forward1(self, features, image_shapes, proposals):
        print(f'circle_proposals:{len(proposals)}')
        # cs_features= features['0']
        # print(f'features-0:{features['0'].shape}')
        # cs_features = self.channel_compress(features['0'])
        # cs_features=features['0']
        cs_features = features
        # filtered_proposals = [proposal for proposal in proposals if proposal.shape[0] > 0]
        #
        # if len(filtered_proposals) > 0:
        #     filtered_proposals_tensor = torch.cat(filtered_proposals)
        #     print(f'filtered_proposals_tensor:{filtered_proposals_tensor.shape}')
        #     proposals=filtered_proposals
        # point_proposals_tensor = torch.cat(proposals)
        # print(f'point_proposals_tensor:{point_proposals_tensor.shape}')

        feature_logits = self.ins_head(cs_features)
        print(f'feature_logits from circle_head:{feature_logits.shape}')

        roi_features = features_align(feature_logits, proposals, image_shapes)
        if roi_features is not None:
            print(f'roi_features from align:{roi_features.shape}')
        return roi_features


    def arc_forward1(self, features, image_shapes, proposals):
        print(f'arc_proposals:{len(proposals)}')
        # cs_features= features['0']
        # print(f'features-0:{features['0'].shape}')
        # cs_features = self.channel_compress(features['0'])
        # cs_features=features['0']
        cs_features = features
        # filtered_proposals = [proposal for proposal in proposals if proposal.shape[0] > 0]
        #
        # if len(filtered_proposals) > 0:
        #     filtered_proposals_tensor = torch.cat(filtered_proposals)
        #     print(f'filtered_proposals_tensor:{filtered_proposals_tensor.shape}')
        #     proposals=filtered_proposals
        # point_proposals_tensor = torch.cat(proposals)
        # print(f'point_proposals_tensor:{point_proposals_tensor.shape}')

        feature_logits = self.arc_predictor(cs_features)
        print(f'feature_logits from arc_head:{feature_logits.shape}')

        roi_features = features_align(feature_logits, proposals, image_shapes)
        if roi_features is not None:
            print(f'roi_features from align:{roi_features.shape}')
        return roi_features