syntax = "proto2"; package object_detection.protos; import "object_detection/protos/anchor_generator.proto"; import "object_detection/protos/box_predictor.proto"; import "object_detection/protos/hyperparams.proto"; import "object_detection/protos/image_resizer.proto"; import "object_detection/protos/losses.proto"; import "object_detection/protos/post_processing.proto"; // Configuration for Faster R-CNN models. // See meta_architectures/faster_rcnn_meta_arch.py and models/model_builder.py // // Naming conventions: // Faster R-CNN models have two stages: a first stage region proposal network // (or RPN) and a second stage box classifier. We thus use the prefixes // `first_stage_` and `second_stage_` to indicate the stage to which each // parameter pertains when relevant. message FasterRcnn { // Whether to construct only the Region Proposal Network (RPN). optional bool first_stage_only = 1 [default=false]; // Number of classes to predict. optional int32 num_classes = 3; // Image resizer for preprocessing the input image. optional ImageResizer image_resizer = 4; // Feature extractor config. optional FasterRcnnFeatureExtractor feature_extractor = 5; // (First stage) region proposal network (RPN) parameters. // Anchor generator to compute RPN anchors. optional AnchorGenerator first_stage_anchor_generator = 6; // Atrous rate for the convolution op applied to the // `first_stage_features_to_crop` tensor to obtain box predictions. optional int32 first_stage_atrous_rate = 7 [default=1]; // Hyperparameters for the convolutional RPN box predictor. optional Hyperparams first_stage_box_predictor_conv_hyperparams = 8; // Kernel size to use for the convolution op just prior to RPN box // predictions. optional int32 first_stage_box_predictor_kernel_size = 9 [default=3]; // Output depth for the convolution op just prior to RPN box predictions. optional int32 first_stage_box_predictor_depth = 10 [default=512]; // The batch size to use for computing the first stage objectness and // location losses. optional int32 first_stage_minibatch_size = 11 [default=256]; // Fraction of positive examples per image for the RPN. optional float first_stage_positive_balance_fraction = 12 [default=0.5]; // Non max suppression score threshold applied to first stage RPN proposals. optional float first_stage_nms_score_threshold = 13 [default=0.0]; // Non max suppression IOU threshold applied to first stage RPN proposals. optional float first_stage_nms_iou_threshold = 14 [default=0.7]; // Maximum number of RPN proposals retained after first stage postprocessing. optional int32 first_stage_max_proposals = 15 [default=300]; // First stage RPN localization loss weight. optional float first_stage_localization_loss_weight = 16 [default=1.0]; // First stage RPN objectness loss weight. optional float first_stage_objectness_loss_weight = 17 [default=1.0]; // Per-region cropping parameters. // Note that if a R-FCN model is constructed the per region cropping // parameters below are ignored. // Output size (width and height are set to be the same) of the initial // bilinear interpolation based cropping during ROI pooling. optional int32 initial_crop_size = 18; // Kernel size of the max pool op on the cropped feature map during // ROI pooling. optional int32 maxpool_kernel_size = 19; // Stride of the max pool op on the cropped feature map during ROI pooling. optional int32 maxpool_stride = 20; // (Second stage) box classifier parameters // Hyperparameters for the second stage box predictor. If box predictor type // is set to rfcn_box_predictor, a R-FCN model is constructed, otherwise a // Faster R-CNN model is constructed. optional BoxPredictor second_stage_box_predictor = 21; // The batch size per image used for computing the classification and refined // location loss of the box classifier. // Note that this field is ignored if `hard_example_miner` is configured. optional int32 second_stage_batch_size = 22 [default=64]; // Fraction of positive examples to use per image for the box classifier. optional float second_stage_balance_fraction = 23 [default=0.25]; // Post processing to apply on the second stage box classifier predictions. // Note: the `score_converter` provided to the FasterRCNNMetaArch constructor // is taken from this `second_stage_post_processing` proto. optional PostProcessing second_stage_post_processing = 24; // Second stage refined localization loss weight. optional float second_stage_localization_loss_weight = 25 [default=1.0]; // Second stage classification loss weight optional float second_stage_classification_loss_weight = 26 [default=1.0]; // If not left to default, applies hard example mining. optional HardExampleMiner hard_example_miner = 27; } message FasterRcnnFeatureExtractor { // Type of Faster R-CNN model (e.g., 'faster_rcnn_resnet101'; // See models/model_builder.py for expected types). optional string type = 1; // Output stride of extracted RPN feature map. optional int32 first_stage_features_stride = 2 [default=16]; }