Merge branch 'master' into patch-1

gadcam · web-flow · commit 2a21855fd3b6 · 2018-08-11T20:38:21.000+02:00
diff --git a/CMakeLists.txt b/CMakeLists.txt
@@ -38,7 +38,7 @@ target_link_libraries(caffe2_detectron_custom_ops caffe2_library)
 install(TARGETS caffe2_detectron_custom_ops DESTINATION lib)
 
 # Install custom GPU ops lib, if gpu is present.
-if (${CAFFE2_FOUND_CUDA})
+if (CAFFE2_USE_CUDA OR CAFFE2_FOUND_CUDA)
   # Additional -I prefix is required for CMake versions before commit (< 3.7):
   # https://github.com/Kitware/CMake/commit/7ded655f7ba82ea72a82d0555449f2df5ef38594
   list(APPEND CUDA_INCLUDE_DIRS -I${CAFFE2_INCLUDE_DIRS})
diff --git a/INSTALL.md b/INSTALL.md
@@ -69,7 +69,7 @@ Set up Python modules:
 cd $DETECTRON && make
 ```
 
-Check that Detectron tests pass (e.g. for [`SpatialNarrowAsOp test`](tests/test_spatial_narrow_as_op.py)):
+Check that Detectron tests pass (e.g. for [`SpatialNarrowAsOp test`](detectron/tests/test_spatial_narrow_as_op.py)):
 
 ```
 python2 $DETECTRON/detectron/tests/test_spatial_narrow_as_op.py
@@ -115,7 +115,7 @@ cd $DETECTRON/docker
 docker build -t detectron:c2-cuda9-cudnn7 .
 ```
 
-Run the image (e.g. for [`BatchPermutationOp test`](tests/test_batch_permutation_op.py)):
+Run the image (e.g. for [`BatchPermutationOp test`](detectron/tests/test_batch_permutation_op.py)):
 
 ```
 nvidia-docker run --rm -it detectron:c2-cuda9-cudnn7 python2 detectron/tests/test_batch_permutation_op.py
@@ -129,7 +129,7 @@ In case of Caffe2 installation problems, please read the troubleshooting section
 
 Caffe2 comes with performance [`profiling`](https://github.com/caffe2/caffe2/tree/master/caffe2/contrib/prof)
 support which you may find useful for benchmarking or debugging your operators
-(see [`BatchPermutationOp test`](tests/test_batch_permutation_op.py) for example usage).
+(see [`BatchPermutationOp test`](detectron/tests/test_batch_permutation_op.py) for example usage).
 Profiling support is not built by default and you can enable it by setting
 the `-DUSE_PROF=ON` flag when running Caffe2 CMake.
 
diff --git a/cmake/Summary.cmake b/cmake/Summary.cmake
@@ -11,9 +11,11 @@ function (detectron_print_config_summary)
   message(STATUS "  CXX flags            : ${CMAKE_CXX_FLAGS}")
   message(STATUS "  Caffe2 version       : ${CAFFE2_VERSION}")
   message(STATUS "  Caffe2 include path  : ${CAFFE2_INCLUDE_DIRS}")
-  message(STATUS "  Caffe2 found CUDA    : ${CAFFE2_FOUND_CUDA}")
-  if (${CAFFE2_FOUND_CUDA})
+  if (CAFFE2_USE_CUDA OR CAFFE2_FOUND_CUDA)
+    message(STATUS "  Caffe2 found CUDA    : True")
     message(STATUS "    CUDA version       : ${CUDA_VERSION}")
     message(STATUS "    CuDNN version      : ${CUDNN_VERSION}")
+  else()
+    message(STATUS "  Caffe2 found CUDA    : False")
   endif()
 endfunction()
diff --git a/configs/04_2018_gn_baselines/scratch_e2e_mask_rcnn_R-101-FPN_3x_gn.yaml b/configs/04_2018_gn_baselines/scratch_e2e_mask_rcnn_R-101-FPN_3x_gn.yaml
@@ -37,6 +37,7 @@ MRCNN:
   CONV_INIT: MSRAFill  # default GaussianFill
 TRAIN:
   # WEIGHTS: N/A
+  FREEZE_AT: 0
   DATASETS: ('coco_2014_train', 'coco_2014_valminusminival')
   SCALES: (800,)
   MAX_SIZE: 1333
diff --git a/configs/04_2018_gn_baselines/scratch_e2e_mask_rcnn_R-50-FPN_3x_gn.yaml b/configs/04_2018_gn_baselines/scratch_e2e_mask_rcnn_R-50-FPN_3x_gn.yaml
@@ -37,6 +37,7 @@ MRCNN:
   CONV_INIT: MSRAFill  # default GaussianFill
 TRAIN:
   # WEIGHTS: N/A
+  FREEZE_AT: 0
   DATASETS: ('coco_2014_train', 'coco_2014_valminusminival')
   SCALES: (800,)
   MAX_SIZE: 1333
diff --git a/detectron/core/config.py b/detectron/core/config.py
@@ -189,6 +189,12 @@
 # output directory
 __C.TRAIN.AUTO_RESUME = True
 
+# Training will copy TRAIN.WEIGHTS and treat it as a candidate checkpoint
+__C.TRAIN.COPY_WEIGHTS = False
+
+# Add StopGrad at a specified stage so the bottom layers are frozen
+__C.TRAIN.FREEZE_AT = 2
+
 
 # ---------------------------------------------------------------------------- #
 # Data loader options (see detectron/roi_data/loader.py for more info)
@@ -776,7 +782,7 @@
 
 
 # ---------------------------------------------------------------------------- #
-# Keyoint Mask R-CNN options ("KRCNN" = Mask R-CNN with Keypoint support)
+# Keypoint Mask R-CNN options ("KRCNN" = Mask R-CNN with Keypoint support)
 # ---------------------------------------------------------------------------- #
 __C.KRCNN = AttrDict()
 
@@ -966,6 +972,9 @@
 # Absolute and relative tolerance to use when comparing to EXPECTED_RESULTS
 __C.EXPECTED_RESULTS_RTOL = 0.1
 __C.EXPECTED_RESULTS_ATOL = 0.005
+# When the expected value specifies a mean and standard deviation, we check
+# that the actual value is within mean +/- SIGMA_TOL * std
+__C.EXPECTED_RESULTS_SIGMA_TOL = 4
 # Set to send email in case of an EXPECTED_RESULTS failure
 __C.EXPECTED_RESULTS_EMAIL = b''
 
@@ -988,7 +997,7 @@
 # If an option is removed from the code and you don't want to break existing
 # yaml configs, you can add the full config key as a string to the set below.
 # ---------------------------------------------------------------------------- #
-_DEPCRECATED_KEYS = set(
+_DEPRECATED_KEYS = set(
     {
         'FINAL_MSG',
         'MODEL.DILATION',
@@ -1189,7 +1198,7 @@ def _merge_a_into_b(a, b, stack=None):
 
 
 def _key_is_deprecated(full_key):
-    if full_key in _DEPCRECATED_KEYS:
+    if full_key in _DEPRECATED_KEYS:
         logger.warn(
             'Deprecated config key (ignoring): {}'.format(full_key)
         )
diff --git a/detectron/datasets/data/README.md b/detectron/datasets/data/README.md
@@ -51,7 +51,8 @@ VOC<year>
 |  |_ ...
 |  |_ <im-N-name>.jpg
 |_ annotations
-|  |_ voc_<year>_trainval.json
+|  |_ voc_<year>_train.json
+|  |_ voc_<year>_val.json
 |  |_ ...
 |_ VOCdevkit<year>
 ```
diff --git a/detectron/datasets/dataset_catalog.py b/detectron/datasets/dataset_catalog.py
@@ -162,11 +162,19 @@
         _ANN_FN:
             _DATA_DIR + '/coco/annotations/image_info_test-dev2015.json'
     },
-    'voc_2007_trainval': {
+    'voc_2007_train': {
         _IM_DIR:
             _DATA_DIR + '/VOC2007/JPEGImages',
         _ANN_FN:
-            _DATA_DIR + '/VOC2007/annotations/voc_2007_trainval.json',
+            _DATA_DIR + '/VOC2007/annotations/voc_2007_train.json',
+        _DEVKIT_DIR:
+            _DATA_DIR + '/VOC2007/VOCdevkit2007'
+    },
+    'voc_2007_val': {
+        _IM_DIR:
+            _DATA_DIR + '/VOC2007/JPEGImages',
+        _ANN_FN:
+            _DATA_DIR + '/VOC2007/annotations/voc_2007_val.json',
         _DEVKIT_DIR:
             _DATA_DIR + '/VOC2007/VOCdevkit2007'
     },
@@ -178,11 +186,19 @@
         _DEVKIT_DIR:
             _DATA_DIR + '/VOC2007/VOCdevkit2007'
     },
-    'voc_2012_trainval': {
+    'voc_2012_train': {
+        _IM_DIR:
+            _DATA_DIR + '/VOC2012/JPEGImages',
+        _ANN_FN:
+            _DATA_DIR + '/VOC2012/annotations/voc_2012_train.json',
+        _DEVKIT_DIR:
+            _DATA_DIR + '/VOC2012/VOCdevkit2012'
+    },
+    'voc_2012_val': {
         _IM_DIR:
             _DATA_DIR + '/VOC2012/JPEGImages',
         _ANN_FN:
-            _DATA_DIR + '/VOC2012/annotations/voc_2012_trainval.json',
+            _DATA_DIR + '/VOC2012/annotations/voc_2012_val.json',
         _DEVKIT_DIR:
             _DATA_DIR + '/VOC2012/VOCdevkit2012'
     }
diff --git a/detectron/datasets/json_dataset.py b/detectron/datasets/json_dataset.py
@@ -43,6 +43,7 @@
 from detectron.utils.timer import Timer
 import detectron.datasets.dataset_catalog as dataset_catalog
 import detectron.utils.boxes as box_utils
+import detectron.utils.segms as segm_utils
 
 logger = logging.getLogger(__name__)
 
@@ -167,8 +168,8 @@ def _add_gt_annotations(self, entry):
         width = entry['width']
         height = entry['height']
         for obj in objs:
-            # crowd regions are RLE encoded and stored as dicts
-            if isinstance(obj['segmentation'], list):
+            # crowd regions are RLE encoded
+            if segm_utils.is_poly(obj['segmentation']):
                 # Valid polygons have >= 3 points, so require >= 6 coordinates
                 obj['segmentation'] = [
                     p for p in obj['segmentation'] if len(p) >= 6
diff --git a/detectron/datasets/task_evaluation.py b/detectron/datasets/task_evaluation.py
@@ -195,6 +195,11 @@ def check_expected_results(results, atol=0.005, rtol=0.1):
     Expected results should take the form of a list of expectations, each
     specified by four elements: [dataset, task, metric, expected value]. For
     example: [['coco_2014_minival', 'box_proposal', 'AR@1000', 0.387], ...].
+
+    The expected value may also be formatted as a list [mean, std] providing
+    an empirical mean and standard deviation from which a valid range is computed
+    using cfg.EXPECTED_RESULTS_SIGMA_TOL. For example:
+    [['coco_2014_minival', 'box_proposal', 'AR@1000', [0.387, 0.001]], ...]
     """
     # cfg contains a reference set of results that we want to check against
     if len(cfg.EXPECTED_RESULTS) == 0:
@@ -206,13 +211,28 @@ def check_expected_results(results, atol=0.005, rtol=0.1):
         assert metric in results[dataset][task], \
             'Metric {} not in results'.format(metric)
         actual_val = results[dataset][task][metric]
-        err = abs(actual_val - expected_val)
-        tol = atol + rtol * abs(expected_val)
-        msg = (
-            '{} > {} > {} sanity check (actual vs. expected): '
-            '{:.3f} vs. {:.3f}, err={:.3f}, tol={:.3f}'
-        ).format(dataset, task, metric, actual_val, expected_val, err, tol)
-        if err > tol:
+        ok = False  # True means the check passed; set in each branch below
+        if isinstance(expected_val, list):
+            assert len(expected_val) == 2, (
+                'Expected result must be in (mean, std) format'
+            )
+            mean, std = expected_val
+            lo = mean - cfg.EXPECTED_RESULTS_SIGMA_TOL * std
+            hi = mean + cfg.EXPECTED_RESULTS_SIGMA_TOL * std
+            ok = (lo < actual_val) and (actual_val < hi)  # open interval
+            msg = (
+                '{} > {} > {} sanity check (actual vs. expected): '
+                '{:.3f} vs. mean={:.4f}, std={:.4f}, range=({:.4f}, {:.4f})'
+            ).format(dataset, task, metric, actual_val, mean, std, lo, hi)
+        else:
+            err = abs(actual_val - expected_val)
+            tol = atol + rtol * abs(expected_val)
+            ok = (err <= tol)  # pass only when the error is within tolerance
+            msg = (
+                '{} > {} > {} sanity check (actual vs. expected): '
+                '{:.3f} vs. {:.3f}, err={:.3f}, tol={:.3f}'
+            ).format(dataset, task, metric, actual_val, expected_val, err, tol)
+        if not ok:
             msg = 'FAIL: ' + msg
             logger.error(msg)
             if cfg.EXPECTED_RESULTS_EMAIL != '':
diff --git a/detectron/modeling/ResNet.py b/detectron/modeling/ResNet.py
@@ -88,10 +88,11 @@ def add_stage(
     return blob_in, dim_in
 
 
-def add_ResNet_convX_body(model, block_counts, freeze_at=2):
+def add_ResNet_convX_body(model, block_counts):
     """Add a ResNet body from input data up through the res5 (aka conv5) stage.
     The final res5/conv5 stage may be optionally excluded (hence convX, where
     X = 4 or 5)."""
+    freeze_at = cfg.TRAIN.FREEZE_AT
     assert freeze_at in [0, 2, 3, 4, 5]
 
     # add the stem (by default, conv1 and pool1 with bn; can support gn)
diff --git a/detectron/modeling/detector.py b/detectron/modeling/detector.py
@@ -446,7 +446,7 @@ def ConvGN(  # args in the same order of Conv()
 
         blob_out = self.SpatialGN(
             conv_blob, prefix + suffix,
-            dim_out, num_groups=group_gn,
+            dim_out, group=group_gn,  # op's arg name is "group"
             epsilon=cfg.GROUP_NORM.EPSILON,)
 
         self.gn_params.append(self.params[-1])  # add gn's bias to list
diff --git a/detectron/roi_data/rpn.py b/detectron/roi_data/rpn.py
@@ -89,12 +89,6 @@ def add_rpn_blobs(blobs, im_scales, roidb):
             (entry['gt_classes'] > 0) & (entry['is_crowd'] == 0)
         )[0]
         gt_rois = entry['boxes'][gt_inds, :] * scale
-        # TODO(rbg): gt_boxes is poorly named;
-        # should be something like 'gt_rois_info'
-        gt_boxes = blob_utils.zeros((len(gt_inds), 6))
-        gt_boxes[:, 0] = im_i  # batch inds
-        gt_boxes[:, 1:5] = gt_rois
-        gt_boxes[:, 5] = entry['gt_classes'][gt_inds]
         im_info = np.array([[im_height, im_width, scale]], dtype=np.float32)
         blobs['im_info'].append(im_info)
 
diff --git a/detectron/utils/net.py b/detectron/utils/net.py
@@ -37,6 +37,7 @@
 import detectron.utils.c2 as c2_utils
 
 logger = logging.getLogger(__name__)
+logger.setLevel(logging.INFO)
 
 
 def initialize_from_weights_file(model, weights_file, broadcast=True):
@@ -90,7 +91,7 @@ def initialize_gpu_from_weights_file(model, weights_file, gpu_id=0):
             dst_name = core.ScopedName(unscoped_param_name)
             has_momentum = src_name + '_momentum' in src_blobs
             has_momentum_str = ' [+ momentum]' if has_momentum else ''
-            logger.debug(
+            logger.info(
                 '{:s}{:} loaded from weights file into {:s}: {}'.format(
                     src_name, has_momentum_str, dst_name, src_blobs[src_name]
                     .shape
@@ -128,7 +129,7 @@ def initialize_gpu_from_weights_file(model, weights_file, gpu_id=0):
             with c2_utils.CpuScope():
                 workspace.FeedBlob(
                     '__preserve__/{:s}'.format(src_name), src_blobs[src_name])
-                logger.debug(
+                logger.info(
                     '{:s} preserved in workspace (unused)'.format(src_name))
 
 
diff --git a/detectron/utils/segms.py b/detectron/utils/segms.py
@@ -31,6 +31,18 @@
 
 import pycocotools.mask as mask_util
 
+# Type used for storing masks in polygon format
+_POLY_TYPE = list
+# Type used for storing masks in RLE format
+_RLE_TYPE = dict
+
+
+def is_poly(segm):
+    """Determine if segm is a polygon. Valid segm expected (polygon or RLE)."""
+    assert isinstance(segm, (_POLY_TYPE, _RLE_TYPE)), \
+        'Invalid segm type: {}'.format(type(segm))  # neither list nor dict
+    return isinstance(segm, _POLY_TYPE)  # False here means RLE (_RLE_TYPE)
+
 
 def flip_segms(segms, height, width):
     """Left/right flip each mask in a list of masks."""
@@ -51,12 +63,11 @@ def _flip_rle(rle, height, width):
 
     flipped_segms = []
     for segm in segms:
-        if type(segm) == list:
+        if is_poly(segm):
             # Polygon format
             flipped_segms.append([_flip_poly(poly, width) for poly in segm])
         else:
             # RLE format
-            assert type(segm) == dict
             flipped_segms.append(_flip_rle(segm, height, width))
     return flipped_segms
 
diff --git a/detectron/utils/train.py b/detectron/utils/train.py
@@ -28,6 +28,7 @@
 from __future__ import print_function
 from __future__ import unicode_literals
 
+from shutil import copyfile
 import cv2  # NOQA (Must import before importing caffe2 due to bug in cv2)
 import logging
 import numpy as np
@@ -109,6 +110,12 @@ def create_model():
             logger.info('model_final.pkl exists; no need to train!')
             return None, None, None, {'final': final_path}, output_dir
 
+        if cfg.TRAIN.COPY_WEIGHTS:
+            copyfile(
+                weights_file,
+                os.path.join(output_dir, os.path.basename(weights_file)))
+            logger.info('Copy {} to {}'.format(weights_file, output_dir))
+
         # Find the most recent checkpoint (highest iteration number)
         files = os.listdir(output_dir)
         for f in files:
diff --git a/detectron/utils/vis.py b/detectron/utils/vis.py
@@ -251,7 +251,7 @@ def vis_one_image_opencv(
 def vis_one_image(
         im, im_name, output_dir, boxes, segms=None, keypoints=None, thresh=0.9,
         kp_thresh=2, dpi=200, box_alpha=0.0, dataset=None, show_class=False,
-        ext='pdf'):
+        ext='pdf', out_when_no_box=False):
     """Visual debugging of detections."""
     if not os.path.exists(output_dir):
         os.makedirs(output_dir)
@@ -260,7 +260,7 @@ def vis_one_image(
         boxes, segms, keypoints, classes = convert_from_cls_format(
             boxes, segms, keypoints)
 
-    if boxes is None or boxes.shape[0] == 0 or max(boxes[:, 4]) < thresh:
+    if (boxes is None or boxes.shape[0] == 0 or max(boxes[:, 4]) < thresh) and not out_when_no_box:
         return
 
     dataset_keypoints, _ = keypoint_utils.get_keypoints()
@@ -281,9 +281,12 @@ def vis_one_image(
     fig.add_axes(ax)
     ax.imshow(im)
 
-    # Display in largest to smallest order to reduce occlusion
-    areas = (boxes[:, 2] - boxes[:, 0]) * (boxes[:, 3] - boxes[:, 1])
-    sorted_inds = np.argsort(-areas)
+    if boxes is None:
+        sorted_inds = [] # avoid crash when 'boxes' is None
+    else:
+        # Display in largest to smallest order to reduce occlusion
+        areas = (boxes[:, 2] - boxes[:, 0]) * (boxes[:, 3] - boxes[:, 1])
+        sorted_inds = np.argsort(-areas)
 
     mask_color_id = 0
     for i in sorted_inds:
diff --git a/projects/GN/README.md b/projects/GN/README.md
diff --git a/tools/convert_pkl_to_pb.py b/tools/convert_pkl_to_pb.py
diff --git a/tools/infer.py b/tools/infer.py
diff --git a/tools/infer_simple.py b/tools/infer_simple.py