ssm

we1pingyu · we1pingyu · commit 52c5bd39bc0f · 2020-12-04T16:09:17.000+08:00
diff --git a/.gitignore b/.gitignore
@@ -22,6 +22,7 @@ data/*
 */**/**/*.pyc
 */**/**/**/*.pyc
 */**/**/**/**/*.pyc
+vis/
 aten/build/
 aten/src/ATen/Config.h
 aten/src/ATen/cuda/CUDAConfig.h
diff --git a/detection/frcnn_feature.py b/detection/frcnn_feature.py
@@ -18,6 +18,7 @@
 from torch.jit.annotations import Optional, List, Dict, Tuple
 from torchvision.ops import boxes as box_ops
 from torchvision.models.utils import load_state_dict_from_url
+import torch
 
 model_urls = {
     'fasterrcnn_resnet50_fpn_coco':
@@ -63,8 +64,81 @@ def _fastrcnn_loss(class_logits, box_regression, labels, regression_targets):
     return classification_loss, box_loss
 
 
+def judge_y(score):
+    """Map every entry of ``score`` to a +1 / -1 label.
+
+    An entry gets 1 when it equals 1 or when log(s) > log(1 - s);
+    every other entry gets -1.
+
+    return :
+    y: list of len(score)
+    """
+    return [1 if (s == 1 or torch.log(s) > torch.log(1 - s)) else -1
+            for s in score]
+
+
 class RoIHeads(_RoIHeads):
-    def forward(self, features, proposals, image_shapes, targets=None):
+
+    def ssm_postprocess_detections(self, class_logits, box_regression, proposals, image_shapes):
+        """Decode RoI-head outputs into boxes, class-score vectors and judge_y labels.
+
+        Detections kept by per-class NMS and score_thresh are pooled over all images.
+        Returns ([boxes], [scores], [labels], al_idx); al_idx becomes 1 when an image
+        has no foreground scores, or none reaching CONF_THRESH (it is skipped).
+        """
+        device = class_logits.device
+        num_classes = class_logits.shape[-1]
+        boxes_per_image = [len(boxes_in_image) for boxes_in_image in proposals]
+        pred_boxes = self.box_coder.decode(box_regression, proposals)
+        pred_scores = F.softmax(class_logits, -1)
+        # split boxes and scores per image
+        pred_boxes = pred_boxes.split(boxes_per_image, 0)
+        pred_scores = pred_scores.split(boxes_per_image, 0)
+        al_idx = 0
+        # accumulate on the logits' device (not a hard-coded .cuda()) so torch.cat
+        # below also works on CPU or on a non-default GPU
+        all_boxes = torch.empty([0, 4], device=device)
+        all_scores = torch.tensor([], device=device)
+        all_labels = []
+        CONF_THRESH = 0.1  # bigger leads more active learning samples
+        for boxes, scores, image_shape in zip(pred_boxes, pred_scores, image_shapes):
+            boxes = box_ops.clip_boxes_to_image(boxes, image_shape)
+            # create labels for each prediction
+            labels = torch.arange(num_classes, device=device)
+            labels = labels.view(1, -1).expand_as(scores)
+            # remove predictions with the background label
+            boxes = boxes[:, 1:]
+            scores = scores[:, 1:]
+            labels = labels[:, 1:]
+            # torch.max raises on an empty tensor, so test for "no scores" first
+            if scores.numel() == 0 or torch.max(scores) < CONF_THRESH:
+                al_idx = 1
+                continue
+            for cls_ind in range(num_classes - 1):
+                cls_boxes = boxes[:, cls_ind]
+                cls_scores = scores[:, cls_ind]
+                cls_labels = labels[:, cls_ind]
+                # batch everything, by making every class prediction be a separate instance
+                cls_boxes = cls_boxes.reshape(-1, 4)
+                cls_scores = cls_scores.flatten()
+                cls_labels = cls_labels.flatten()
+
+                # non-maximum suppression, independently done per class
+                keep = box_ops.batched_nms(cls_boxes, cls_scores, cls_labels, self.nms_thresh)
+                # keep only topk scoring predictions
+                keep = keep[:self.detections_per_img]
+                cls_boxes, cls_scores, cls_labels = cls_boxes[keep], cls_scores[keep], cls_labels[keep]
+                # remove low scoring boxes
+                inds = torch.nonzero(cls_scores > self.score_thresh).squeeze(1)
+                if len(inds) == 0:
+                    continue
+                # keep[inds] maps survivors back to proposal rows of ``scores``
+                all_boxes = torch.cat((all_boxes, cls_boxes[inds]), 0)
+                all_scores = torch.cat((all_scores, scores[keep[inds]]), 0)
+                all_labels.extend(judge_y(scores[k]) for k in keep[inds])
+        return [all_boxes], [all_scores], [all_labels], al_idx
+
+    def forward(self, features, proposals, image_shapes, ssm, targets=None):
         # type: (Dict[str, Tensor], List[Tensor], List[Tuple[int, int]], Optional[List[Dict[str, Tensor]]])
         """
         Arguments:
@@ -101,106 +175,31 @@ def forward(self, features, proposals, image_shapes, targets=None):
                 "loss_box_reg": loss_box_reg
             }
         else:
-            boxes, scores, labels = self.postprocess_detections(class_logits, box_regression, proposals, image_shapes)
-            num_images = len(boxes)
-            for i in range(num_images):
-                result.append(
-                    {
-                        "boxes": boxes[i],
-                        "labels": labels[i],
-                        "scores": scores[i],
-                    }
-                )
-
-        if self.has_mask():
-            mask_proposals = [p["boxes"] for p in result]
-            if self.training:
-                assert matched_idxs is not None
-                # during training, only focus on positive boxes
-                num_images = len(proposals)
-                mask_proposals = []
-                pos_matched_idxs = []
-                for img_id in range(num_images):
-                    pos = torch.nonzero(labels[img_id] > 0).squeeze(1)
-                    mask_proposals.append(proposals[img_id][pos])
-                    pos_matched_idxs.append(matched_idxs[img_id][pos])
-            else:
-                pos_matched_idxs = None
-
-            if self.mask_roi_pool is not None:
-                mask_features = self.mask_roi_pool(features, mask_proposals, image_shapes)
-                mask_features = self.mask_head(mask_features)
-                mask_logits = self.mask_predictor(mask_features)
-            else:
-                mask_logits = torch.tensor(0)
-                raise Exception("Expected mask_roi_pool to be not None")
-
-            loss_mask = {}
-            if self.training:
-                assert targets is not None
-                assert pos_matched_idxs is not None
-                assert mask_logits is not None
-
-                gt_masks = [t["masks"] for t in targets]
-                gt_labels = [t["labels"] for t in targets]
-                rcnn_loss_mask = maskrcnn_loss(
-                    mask_logits, mask_proposals,
-                    gt_masks, gt_labels, pos_matched_idxs)
-                loss_mask = {
-                    "loss_mask": rcnn_loss_mask
-                }
+            if ssm:
+                boxes, scores, labels, al = self.ssm_postprocess_detections(class_logits, box_regression,
+                                                                            proposals, image_shapes)
+                num_images = len(boxes)
+                for i in range(num_images):
+                    result.append(
+                        {
+                            "boxes": boxes[i],
+                            "labels": labels[i],
+                            "scores": scores[i],
+                            'al': al,
+                        }
+                    )
             else:
-                labels = [r["labels"] for r in result]
-                masks_probs = maskrcnn_inference(mask_logits, labels)
-                for mask_prob, r in zip(masks_probs, result):
-                    r["masks"] = mask_prob
-
-            losses.update(loss_mask)
-
-        # keep none checks in if conditional so torchscript will conditionally
-        # compile each branch
-        if self.keypoint_roi_pool is not None and self.keypoint_head is not None \
-                and self.keypoint_predictor is not None:
-            keypoint_proposals = [p["boxes"] for p in result]
-            if self.training:
-                # during training, only focus on positive boxes
-                num_images = len(proposals)
-                keypoint_proposals = []
-                pos_matched_idxs = []
-                assert matched_idxs is not None
-                for img_id in range(num_images):
-                    pos = torch.nonzero(labels[img_id] > 0).squeeze(1)
-                    keypoint_proposals.append(proposals[img_id][pos])
-                    pos_matched_idxs.append(matched_idxs[img_id][pos])
-            else:
-                pos_matched_idxs = None
-
-            keypoint_features = self.keypoint_roi_pool(features, keypoint_proposals, image_shapes)
-            keypoint_features = self.keypoint_head(keypoint_features)
-            keypoint_logits = self.keypoint_predictor(keypoint_features)
-
-            loss_keypoint = {}
-            if self.training:
-                assert targets is not None
-                assert pos_matched_idxs is not None
-
-                gt_keypoints = [t["keypoints"] for t in targets]
-                rcnn_loss_keypoint = keypointrcnn_loss(
-                    keypoint_logits, keypoint_proposals,
-                    gt_keypoints, pos_matched_idxs)
-                loss_keypoint = {
-                    "loss_keypoint": rcnn_loss_keypoint
-                }
-            else:
-                assert keypoint_logits is not None
-                assert keypoint_proposals is not None
-
-                keypoints_probs, kp_scores = keypointrcnn_inference(keypoint_logits, keypoint_proposals)
-                for keypoint_prob, kps, r in zip(keypoints_probs, kp_scores, result):
-                    r["keypoints"] = keypoint_prob
-                    r["keypoints_scores"] = kps
-
-            losses.update(loss_keypoint)
+                boxes, scores, labels = self.postprocess_detections(class_logits, box_regression,
+                                                                    proposals, image_shapes)
+                num_images = len(boxes)
+                for i in range(num_images):
+                    result.append(
+                        {
+                            "boxes": boxes[i],
+                            "labels": labels[i],
+                            "scores": scores[i],
+                        }
+                    )
 
         return result, losses
 
@@ -561,9 +560,7 @@ def __init__(self, backbone, num_classes=None,
             box_predictor = FastRCNNPredictor(
                 representation_size,
                 num_classes)
-
-        roi_heads = RoIHeads(
-            # Box
+        roi_heads = RoIHeads(  # Box
             box_roi_pool, box_head, box_predictor,
             box_fg_iou_thresh, box_bg_iou_thresh,
             box_batch_size_per_image, box_positive_fraction,
@@ -575,9 +572,12 @@ def __init__(self, backbone, num_classes=None,
         if image_std is None:
             image_std = [0.229, 0.224, 0.225]
         transform = GeneralizedRCNNTransform(min_size, max_size, image_mean, image_std)
-
+        self.ssm = False
         super(FasterRCNN, self).__init__(backbone, rpn, roi_heads, transform)
 
+    def ssm_mode(self, ssm):
+        self.ssm = ssm  # flag that forward() hands to self.roi_heads
+
     def forward(self, images, targets=None):
         # type: (List[Tensor], Optional[List[Dict[str, Tensor]]])
         """
@@ -603,7 +603,8 @@ def forward(self, images, targets=None):
         if isinstance(features, torch.Tensor):
             features = OrderedDict([('0', features)])
         proposals, proposal_losses = self.rpn(images, features, targets)
-        detections, detector_losses = self.roi_heads(features, proposals, images.image_sizes, targets)
+        detections, detector_losses = self.roi_heads(features, proposals, images.image_sizes, self.ssm, targets)
+        # if not len(detections) == 0:
         detections = self.transform.postprocess(detections, images.image_sizes, original_image_sizes)
 
         losses = {}
@@ -627,7 +628,6 @@ def fasterrcnn_resnet50_fpn_feature(pretrained=False, progress=True,
     backbone = resnet_fpn_backbone('resnet50', pretrained_backbone)
     model = FRCNN_Feature(backbone, num_classes, **kwargs)
     if pretrained:
-        print(model_urls.keys())
         state_dict = load_state_dict_from_url(model_urls['fasterrcnn_resnet50_fpn_coco'],
                                               progress=progress)
         model.load_state_dict(state_dict)
diff --git a/detection/group_by_aspect_ratio.py b/detection/group_by_aspect_ratio.py
@@ -190,6 +190,6 @@ def create_aspect_ratio_groups(dataset, k=0):
     # count number of elements per group
     counts = np.unique(groups, return_counts=True)[1]
     fbins = [0] + bins + [np.inf]
-    print("Using {} as bins for aspect ratio quantization".format(fbins))
-    print("Count of instances per bin: {}".format(counts))
+    # print("Using {} as bins for aspect ratio quantization".format(fbins))
+    # print("Count of instances per bin: {}".format(counts))
     return groups
diff --git a/ll4al/main.py b/ll4al/main.py
@@ -52,10 +52,10 @@
     T.Normalize([0.4914, 0.4822, 0.4465], [0.2023, 0.1994, 0.2010])
     # T.Normalize((0.5071, 0.4867, 0.4408), (0.2675, 0.2565, 0.2761)) # CIFAR-100
 ])
-
-cifar10_train = CIFAR10('/home/omnisky/ywp/data', train=True, download=True, transform=train_transform)
-cifar10_unlabeled = CIFAR10('/home/omnisky/ywp/data', train=True, download=True, transform=test_transform)
-cifar10_test = CIFAR10('/home/omnisky/ywp/data', train=False, download=True, transform=test_transform)
+#
+# cifar10_train = CIFAR10('/home/omnisky/ywp/data', train=True, download=True, transform=train_transform)
+# cifar10_unlabeled = CIFAR10('/home/omnisky/ywp/data', train=True, download=True, transform=test_transform)
+# cifar10_test = CIFAR10('/home/omnisky/ywp/data', train=False, download=True, transform=test_transform)
 
 
 ##
diff --git a/ll_train.py b/ll_train.py
@@ -216,15 +216,14 @@ def main(args):
 
         # Update the labeled dataset and the unlabeled dataset, respectively
         labeled_set += list(torch.tensor(subset)[arg][int(-0.05 * num_images):].numpy())
-        unlabeled_set = list(torch.tensor(subset)[arg][:int(-0.05 * num_images)].numpy()) + \
-                        unlabeled_set[int(0.2 * num_images):]
+        unlabeled_set = list(torch.tensor(subset)[arg][:int(-0.05 * num_images)].numpy()) + unlabeled_set
 
         # Create a new dataloader for the updated labeled dataset
         train_sampler = SubsetRandomSampler(labeled_set)
 
-    total_time = time.time() - start_time
-    total_time_str = str(datetime.timedelta(seconds=int(total_time)))
-    print('Training time {}'.format(total_time_str))
+        total_time = time.time() - start_time
+        total_time_str = str(datetime.timedelta(seconds=int(total_time)))
+        print('Training time {}'.format(total_time_str))
 
 
 if __name__ == "__main__":
diff --git a/random_train.py b/random_train.py
@@ -119,7 +119,6 @@ def main(args):
     indices = list(range(num_images))
     random.shuffle(indices)
     labeled_set = indices[:int(num_images * 0.1)]
-    print(labeled_set)
     unlabeled_set = indices[int(num_images * 0.1):]
     train_sampler = SubsetRandomSampler(labeled_set)
     test_sampler = torch.utils.data.SequentialSampler(dataset_test)
@@ -158,15 +157,15 @@ def main(args):
             train_one_epoch(task_model, task_optimizer, data_loader, device, cycle, epoch, args.print_freq)
             task_lr_scheduler.step()
             # evaluate after pre-set epoch
-            if (epoch + 1) == args.task_epochs or (epoch + 1) == args.total_epochs:
+            if (epoch + 1) == args.total_epochs:
                 if 'coco' in args.dataset:
                     coco_evaluate(task_model, data_loader_test)
                 elif 'voc' in args.dataset:
                     voc_evaluate(task_model, data_loader_test)
         random.shuffle(unlabeled_set)
         # Update the labeled dataset and the unlabeled dataset, respectively
-        labeled_set += unlabeled_set[int(0.05 * num_images):]
-        unlabeled_set = unlabeled_set[:int(0.05 * num_images)]
+        labeled_set += unlabeled_set[:int(0.05 * num_images)]
+        unlabeled_set = unlabeled_set[int(0.05 * num_images):]
 
         # Create a new dataloader for the updated labeled dataset
         train_sampler = SubsetRandomSampler(labeled_set)
@@ -188,15 +187,15 @@ def main(args):
     parser.add_argument('--device', default='cuda', help='device')
     parser.add_argument('-b', '--batch-size', default=2, type=int,
                         help='images per gpu, the total batch size is $NGPU x batch_size')
-    parser.add_argument('--task_epochs', default=15, type=int, metavar='N',
+    parser.add_argument('--task_epochs', default=20, type=int, metavar='N',
                         help='number of total epochs to run')
-    parser.add_argument('--total_epochs', default=15, type=int, metavar='N',
+    parser.add_argument('--total_epochs', default=20, type=int, metavar='N',
                         help='number of total epochs to run')
     parser.add_argument('--cycles', default=7, type=int, metavar='N',
                         help='number of cycles epochs to run')
     parser.add_argument('-j', '--workers', default=4, type=int, metavar='N',
                         help='number of data loading workers (default: 4)')
-    parser.add_argument('--lr', default=0.005, type=float,
+    parser.add_argument('--lr', default=0.0025, type=float,
                         help='initial learning rate, 0.02 is the default value for training '
                              'on 8 gpus and 2 images_per_gpu')
     parser.add_argument('--momentum', default=0.9, type=float, metavar='M',
@@ -205,7 +204,7 @@ def main(args):
                         metavar='W', help='weight decay (default: 1e-4)',
                         dest='weight_decay')
     parser.add_argument('--lr-step-size', default=8, type=int, help='decrease lr every step-size epochs')
-    parser.add_argument('--lr-steps', default=[10], nargs='+', type=int, help='decrease lr every step-size epochs')
+    parser.add_argument('--lr-steps', default=[16, 19], nargs='+', type=int, help='decrease lr every step-size epochs')
     parser.add_argument('--lr-gamma', default=0.1, type=float, help='decrease lr by a factor of lr-gamma')
     parser.add_argument('--print-freq', default=1000, type=int, help='print frequency')
     parser.add_argument('--output-dir', default=None, help='path where to save')
diff --git a/ssm/ssm_helper.py b/ssm/ssm_helper.py
diff --git a/ssm_train.py b/ssm_train.py