better docs

b83b32a2 · Ross Girshick · f8563aef · b83b32a2 · b83b32a2
Commit b83b32a2 authored 10 years ago by Ross Girshick
--- a/examples/caffenet.yml
+++ b/examples/caffenet.yml
+TRAIN:
+  SCALES: !!python/tuple [480, 576, 688, 864, 1200]
+  MAX_SIZE: 2000
+  SNAPSHOT_INFIX: "multiscale"
+TEST:
+  SCALES: !!python/tuple [480, 576, 688, 864, 1200]
+  MAX_SIZE: 2000
--- a/fast_rcnn_config.py
+++ b/fast_rcnn_config.py
@@ -5,6 +5,17 @@
 # Written by Ross Girshick
 # --------------------------------------------------------

+#
+# README
+#
+# This file specifies default config options for Fast R-CNN. You should not
+# change values in this file. Instead, you should write a config YAML file
+# and use cfg_from_file(yaml_file) to load it and override the default options.
+#
+# - See tools/{train,test}_net.py for example code that uses cfg_from_file().
+# - See examples/caffenet.yml for an example YAML config override file.
+#
+
 import os
 import sys
 import numpy as np
@@ -21,49 +32,68 @@ __C = edict()
 cfg = __C

 #
-# Training
+# Training options
 #

 __C.TRAIN                 = edict()

-# SCALES          = (480, 576, 688, 864, 1200)
+# Scales to use during training (can list multiple scales)
+# Each scale is the pixel size of an image's shortest side
 __C.TRAIN.SCALES          = (600,)

-# Max pixel size of a scaled input image
+# Max pixel size of the longest side of a scaled input image
 __C.TRAIN.MAX_SIZE        = 1000

-# Images per batch
+# Images to use per minibatch
 __C.TRAIN.IMS_PER_BATCH   = 2

-# Minibatch size
+# Minibatch size (number of regions of interest [ROIs])
 __C.TRAIN.BATCH_SIZE      = 128

-# Fraction of minibatch that is foreground labeled (class > 0)
+# Fraction of minibatch that is labeled foreground (i.e. class > 0)
 __C.TRAIN.FG_FRACTION     = 0.25

 # Overlap threshold for a ROI to be considered foreground (if >= FG_THRESH)
 __C.TRAIN.FG_THRESH       = 0.5

 # Overlap threshold for a ROI to be considered background (class = 0 if
-# overlap in [0.1, 0.5))
+# overlap in [LO, HI))
 __C.TRAIN.BG_THRESH_HI    = 0.5
 __C.TRAIN.BG_THRESH_LO    = 0.1

 # Use horizontally-flipped images during training?
 __C.TRAIN.USE_FLIPPED     = True

+# Overlap required between a ROI and ground-truth box in order for that ROI to
+# be used as a bounding-box regression training example
 __C.TRAIN.BBOX_THRESH     = 0.5
+
+# Iterations between snapshots
 __C.TRAIN.SNAPSHOT_ITERS  = 10000
+
+# solver.prototxt specifies the snapshot path prefix, this adds an optional
+# infix to yield the path: <prefix>[_<infix>]_iters_XYZ.caffemodel
 __C.TRAIN.SNAPSHOT_INFIX  = ''

 #
-# Testing
+# Testing options
 #

 __C.TEST            = edict()
+
+# Scales to use during testing (can list multiple scales)
+# Each scale is the pixel size of an image's shortest side
 __C.TEST.SCALES     = (600,)
+
+# Max pixel size of the longest side of a scaled input image
 __C.TEST.MAX_SIZE   = 1000
+
+# Overlap threshold used for non-maximum suppression (suppress boxes with
+# IoU >= this threshold)
 __C.TEST.NMS        = 0.3
+
+# Experimental: use binary logistic regression scores instead of K-way softmax
+# scores when testing
 __C.TEST.BINARY     = False

 #
@@ -76,15 +106,21 @@ __C.PIXEL_MEANS     = np.array([[[102.9801, 115.9465, 122.7717]]])

 # Stride in input image pixels at ROI pooling level (network specific)
 # 16 is true for {Alex,Caffe}Net, VGG_CNN_M_1024, and VGG16
+# If your network has a different stride (e.g., VGG_CNN_S has stride 12)
+# make sure to override this in a config file!)
 __C.FEAT_STRIDE     = 16

-# For reproducibility [currently the caffe seed isn't fixed...so there's that]
+# For reproducibility
 __C.RNG_SEED        = 3

 # A small number that's used many times
 __C.EPS             = 1e-14

 def merge_a_into_b(a, b):
+    """
+    Merge config dictionary a into config dictionary b, clobbering the options
+    in b whenever they are also specified in a.
+    """
    if type(a) is not edict:
        return
    for k, v in a.iteritems():
@@ -108,6 +144,10 @@ def merge_a_into_b(a, b):
            b[k] = v

 def cfg_from_file(filename):
+    """
+    Load a config file and merge it into the default options specified in this
+    file.
+    """
    import yaml
    global __C
    with open(filename, 'r') as f: