layer { name: "data" type: "AnnotatedData" top: "data" top: "label" include { phase: TRAIN } transform_param { mirror: true mean_value: 104 mean_value: 117 mean_value: 123 resize_param { prob: 1 resize_mode: WARP height: 300 width: 300 interp_mode: LINEAR interp_mode: AREA interp_mode: NEAREST interp_mode: CUBIC interp_mode: LANCZOS4 } emit_constraint { emit_type: CENTER } distort_param { brightness_prob: 0.5 brightness_delta: 32 contrast_prob: 0.5 contrast_lower: 0.5 contrast_upper: 1.5 hue_prob: 0.5 hue_delta: 18 saturation_prob: 0.5 saturation_lower: 0.5 saturation_upper: 1.5 random_order_prob: 0.0 } expand_param { prob: 0.5 max_expand_ratio: 4.0 } } data_param { source: "train_lmdb/" batch_size: 16 backend: LMDB } annotated_data_param { batch_sampler { max_sample: 1 max_trials: 1 } batch_sampler { sampler { min_scale: 0.3 max_scale: 1.0 min_aspect_ratio: 0.5 max_aspect_ratio: 2.0 } sample_constraint { min_jaccard_overlap: 0.1 } max_sample: 1 max_trials: 50 } batch_sampler { sampler { min_scale: 0.3 max_scale: 1.0 min_aspect_ratio: 0.5 max_aspect_ratio: 2.0 } sample_constraint { min_jaccard_overlap: 0.3 } max_sample: 1 max_trials: 50 } batch_sampler { sampler { min_scale: 0.3 max_scale: 1.0 min_aspect_ratio: 0.5 max_aspect_ratio: 2.0 } sample_constraint { min_jaccard_overlap: 0.5 } max_sample: 1 max_trials: 50 } batch_sampler { sampler { min_scale: 0.3 max_scale: 1.0 min_aspect_ratio: 0.5 max_aspect_ratio: 2.0 } sample_constraint { min_jaccard_overlap: 0.7 } max_sample: 1 max_trials: 50 } batch_sampler { sampler { min_scale: 0.3 max_scale: 1.0 min_aspect_ratio: 0.5 max_aspect_ratio: 2.0 } sample_constraint { min_jaccard_overlap: 0.9 } max_sample: 1 max_trials: 50 } batch_sampler { sampler { min_scale: 0.3 max_scale: 1.0 min_aspect_ratio: 0.5 max_aspect_ratio: 2.0 } sample_constraint { max_jaccard_overlap: 1.0 } max_sample: 1 max_trials: 50 } } } layer { name: "data_bn" type: "BatchNorm" bottom: "data" top: "data_bn" param { lr_mult: 0.0 } param { lr_mult: 0.0 } param { lr_mult: 0.0 } } layer { name: "data_scale" type: "Scale" bottom: "data_bn" top: "data_bn" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } scale_param { bias_term: true } } layer { name: "conv1_h" type: "Convolution" bottom: "data_bn" top: "conv1_h" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } convolution_param { num_output: 32 pad: 3 kernel_size: 7 stride: 2 weight_filler { type: "msra" variance_norm: FAN_OUT } bias_filler { type: "constant" value: 0.0 } } } layer { name: "conv1_bn_h" type: "BatchNorm" bottom: "conv1_h" top: "conv1_h" param { lr_mult: 0.0 } param { lr_mult: 0.0 } param { lr_mult: 0.0 } } layer { name: "conv1_scale_h" type: "Scale" bottom: "conv1_h" top: "conv1_h" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } scale_param { bias_term: true } } layer { name: "conv1_relu" type: "ReLU" bottom: "conv1_h" top: "conv1_h" } layer { name: "conv1_pool" type: "Pooling" bottom: "conv1_h" top: "conv1_pool" pooling_param { kernel_size: 3 stride: 2 } } layer { name: "layer_64_1_conv1_h" type: "Convolution" bottom: "conv1_pool" top: "layer_64_1_conv1_h" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 32 bias_term: false pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_64_1_bn2_h" type: "BatchNorm" bottom: "layer_64_1_conv1_h" top: "layer_64_1_conv1_h" param { lr_mult: 0.0 } param { lr_mult: 0.0 } param { lr_mult: 0.0 } } layer { name: "layer_64_1_scale2_h" type: "Scale" bottom: "layer_64_1_conv1_h" top: "layer_64_1_conv1_h" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } scale_param { bias_term: true } } layer { name: "layer_64_1_relu2" type: "ReLU" bottom: "layer_64_1_conv1_h" top: "layer_64_1_conv1_h" } layer { name: "layer_64_1_conv2_h" type: "Convolution" bottom: "layer_64_1_conv1_h" top: "layer_64_1_conv2_h" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 32 bias_term: false pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_64_1_sum" type: "Eltwise" bottom: "layer_64_1_conv2_h" bottom: "conv1_pool" top: "layer_64_1_sum" } layer { name: "layer_128_1_bn1_h" type: "BatchNorm" bottom: "layer_64_1_sum" top: "layer_128_1_bn1_h" param { lr_mult: 0.0 } param { lr_mult: 0.0 } param { lr_mult: 0.0 } } layer { name: "layer_128_1_scale1_h" type: "Scale" bottom: "layer_128_1_bn1_h" top: "layer_128_1_bn1_h" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } scale_param { bias_term: true } } layer { name: "layer_128_1_relu1" type: "ReLU" bottom: "layer_128_1_bn1_h" top: "layer_128_1_bn1_h" } layer { name: "layer_128_1_conv1_h" type: "Convolution" bottom: "layer_128_1_bn1_h" top: "layer_128_1_conv1_h" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 128 bias_term: false pad: 1 kernel_size: 3 stride: 2 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_128_1_bn2" type: "BatchNorm" bottom: "layer_128_1_conv1_h" top: "layer_128_1_conv1_h" param { lr_mult: 0.0 } param { lr_mult: 0.0 } param { lr_mult: 0.0 } } layer { name: "layer_128_1_scale2" type: "Scale" bottom: "layer_128_1_conv1_h" top: "layer_128_1_conv1_h" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } scale_param { bias_term: true } } layer { name: "layer_128_1_relu2" type: "ReLU" bottom: "layer_128_1_conv1_h" top: "layer_128_1_conv1_h" } layer { name: "layer_128_1_conv2" type: "Convolution" bottom: "layer_128_1_conv1_h" top: "layer_128_1_conv2" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 128 bias_term: false pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_128_1_conv_expand_h" type: "Convolution" bottom: "layer_128_1_bn1_h" top: "layer_128_1_conv_expand_h" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 128 bias_term: false pad: 0 kernel_size: 1 stride: 2 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_128_1_sum" type: "Eltwise" bottom: "layer_128_1_conv2" bottom: "layer_128_1_conv_expand_h" top: "layer_128_1_sum" } layer { name: "layer_256_1_bn1" type: "BatchNorm" bottom: "layer_128_1_sum" top: "layer_256_1_bn1" param { lr_mult: 0.0 } param { lr_mult: 0.0 } param { lr_mult: 0.0 } } layer { name: "layer_256_1_scale1" type: "Scale" bottom: "layer_256_1_bn1" top: "layer_256_1_bn1" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } scale_param { bias_term: true } } layer { name: "layer_256_1_relu1" type: "ReLU" bottom: "layer_256_1_bn1" top: "layer_256_1_bn1" } layer { name: "layer_256_1_conv1" type: "Convolution" bottom: "layer_256_1_bn1" top: "layer_256_1_conv1" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 256 bias_term: false pad: 1 kernel_size: 3 stride: 2 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_256_1_bn2" type: "BatchNorm" bottom: "layer_256_1_conv1" top: "layer_256_1_conv1" param { lr_mult: 0.0 } param { lr_mult: 0.0 } param { lr_mult: 0.0 } } layer { name: "layer_256_1_scale2" type: "Scale" bottom: "layer_256_1_conv1" top: "layer_256_1_conv1" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } scale_param { bias_term: true } } layer { name: "layer_256_1_relu2" type: "ReLU" bottom: "layer_256_1_conv1" top: "layer_256_1_conv1" } layer { name: "layer_256_1_conv2" type: "Convolution" bottom: "layer_256_1_conv1" top: "layer_256_1_conv2" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 256 bias_term: false pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_256_1_conv_expand" type: "Convolution" bottom: "layer_256_1_bn1" top: "layer_256_1_conv_expand" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 256 bias_term: false pad: 0 kernel_size: 1 stride: 2 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_256_1_sum" type: "Eltwise" bottom: "layer_256_1_conv2" bottom: "layer_256_1_conv_expand" top: "layer_256_1_sum" } layer { name: "layer_512_1_bn1" type: "BatchNorm" bottom: "layer_256_1_sum" top: "layer_512_1_bn1" param { lr_mult: 0.0 } param { lr_mult: 0.0 } param { lr_mult: 0.0 } } layer { name: "layer_512_1_scale1" type: "Scale" bottom: "layer_512_1_bn1" top: "layer_512_1_bn1" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } scale_param { bias_term: true } } layer { name: "layer_512_1_relu1" type: "ReLU" bottom: "layer_512_1_bn1" top: "layer_512_1_bn1" } layer { name: "layer_512_1_conv1_h" type: "Convolution" bottom: "layer_512_1_bn1" top: "layer_512_1_conv1_h" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 128 bias_term: false pad: 1 kernel_size: 3 stride: 1 # 2 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_512_1_bn2_h" type: "BatchNorm" bottom: "layer_512_1_conv1_h" top: "layer_512_1_conv1_h" param { lr_mult: 0.0 } param { lr_mult: 0.0 } param { lr_mult: 0.0 } } layer { name: "layer_512_1_scale2_h" type: "Scale" bottom: "layer_512_1_conv1_h" top: "layer_512_1_conv1_h" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } scale_param { bias_term: true } } layer { name: "layer_512_1_relu2" type: "ReLU" bottom: "layer_512_1_conv1_h" top: "layer_512_1_conv1_h" } layer { name: "layer_512_1_conv2_h" type: "Convolution" bottom: "layer_512_1_conv1_h" top: "layer_512_1_conv2_h" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 256 bias_term: false pad: 2 # 1 kernel_size: 3 stride: 1 dilation: 2 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_512_1_conv_expand_h" type: "Convolution" bottom: "layer_512_1_bn1" top: "layer_512_1_conv_expand_h" param { lr_mult: 1.0 decay_mult: 1.0 } convolution_param { num_output: 256 bias_term: false pad: 0 kernel_size: 1 stride: 1 # 2 weight_filler { type: "msra" } bias_filler { type: "constant" value: 0.0 } } } layer { name: "layer_512_1_sum" type: "Eltwise" bottom: "layer_512_1_conv2_h" bottom: "layer_512_1_conv_expand_h" top: "layer_512_1_sum" } layer { name: "last_bn_h" type: "BatchNorm" bottom: "layer_512_1_sum" top: "layer_512_1_sum" param { lr_mult: 0.0 } param { lr_mult: 0.0 } param { lr_mult: 0.0 } } layer { name: "last_scale_h" type: "Scale" bottom: "layer_512_1_sum" top: "layer_512_1_sum" param { lr_mult: 1.0 decay_mult: 1.0 } param { lr_mult: 2.0 decay_mult: 1.0 } scale_param { bias_term: true } } layer { name: "last_relu" type: "ReLU" bottom: "layer_512_1_sum" top: "fc7" } layer { name: "conv6_1_h" type: "Convolution" bottom: "fc7" top: "conv6_1_h" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 128 pad: 0 kernel_size: 1 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv6_1_relu" type: "ReLU" bottom: "conv6_1_h" top: "conv6_1_h" } layer { name: "conv6_2_h" type: "Convolution" bottom: "conv6_1_h" top: "conv6_2_h" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 256 pad: 1 kernel_size: 3 stride: 2 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv6_2_relu" type: "ReLU" bottom: "conv6_2_h" top: "conv6_2_h" } layer { name: "conv7_1_h" type: "Convolution" bottom: "conv6_2_h" top: "conv7_1_h" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 64 pad: 0 kernel_size: 1 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv7_1_relu" type: "ReLU" bottom: "conv7_1_h" top: "conv7_1_h" } layer { name: "conv7_2_h" type: "Convolution" bottom: "conv7_1_h" top: "conv7_2_h" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 128 pad: 1 kernel_size: 3 stride: 2 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv7_2_relu" type: "ReLU" bottom: "conv7_2_h" top: "conv7_2_h" } layer { name: "conv8_1_h" type: "Convolution" bottom: "conv7_2_h" top: "conv8_1_h" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 64 pad: 0 kernel_size: 1 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv8_1_relu" type: "ReLU" bottom: "conv8_1_h" top: "conv8_1_h" } layer { name: "conv8_2_h" type: "Convolution" bottom: "conv8_1_h" top: "conv8_2_h" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 128 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv8_2_relu" type: "ReLU" bottom: "conv8_2_h" top: "conv8_2_h" } layer { name: "conv9_1_h" type: "Convolution" bottom: "conv8_2_h" top: "conv9_1_h" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 64 pad: 0 kernel_size: 1 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv9_1_relu" type: "ReLU" bottom: "conv9_1_h" top: "conv9_1_h" } layer { name: "conv9_2_h" type: "Convolution" bottom: "conv9_1_h" top: "conv9_2_h" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 128 pad: 0 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv9_2_relu" type: "ReLU" bottom: "conv9_2_h" top: "conv9_2_h" } layer { name: "conv4_3_norm" type: "Normalize" bottom: "layer_256_1_bn1" top: "conv4_3_norm" norm_param { across_spatial: false scale_filler { type: "constant" value: 20 } channel_shared: false } } layer { name: "conv4_3_norm_mbox_loc" type: "Convolution" bottom: "conv4_3_norm" top: "conv4_3_norm_mbox_loc" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 16 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv4_3_norm_mbox_loc_perm" type: "Permute" bottom: "conv4_3_norm_mbox_loc" top: "conv4_3_norm_mbox_loc_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "conv4_3_norm_mbox_loc_flat" type: "Flatten" bottom: "conv4_3_norm_mbox_loc_perm" top: "conv4_3_norm_mbox_loc_flat" flatten_param { axis: 1 } } layer { name: "conv4_3_norm_mbox_conf" type: "Convolution" bottom: "conv4_3_norm" top: "conv4_3_norm_mbox_conf" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 8 # 84 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv4_3_norm_mbox_conf_perm" type: "Permute" bottom: "conv4_3_norm_mbox_conf" top: "conv4_3_norm_mbox_conf_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "conv4_3_norm_mbox_conf_flat" type: "Flatten" bottom: "conv4_3_norm_mbox_conf_perm" top: "conv4_3_norm_mbox_conf_flat" flatten_param { axis: 1 } } layer { name: "conv4_3_norm_mbox_priorbox" type: "PriorBox" bottom: "conv4_3_norm" bottom: "data" top: "conv4_3_norm_mbox_priorbox" prior_box_param { min_size: 30.0 max_size: 60.0 aspect_ratio: 2 flip: true clip: false variance: 0.1 variance: 0.1 variance: 0.2 variance: 0.2 step: 8 offset: 0.5 } } layer { name: "fc7_mbox_loc" type: "Convolution" bottom: "fc7" top: "fc7_mbox_loc" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 24 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "fc7_mbox_loc_perm" type: "Permute" bottom: "fc7_mbox_loc" top: "fc7_mbox_loc_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "fc7_mbox_loc_flat" type: "Flatten" bottom: "fc7_mbox_loc_perm" top: "fc7_mbox_loc_flat" flatten_param { axis: 1 } } layer { name: "fc7_mbox_conf" type: "Convolution" bottom: "fc7" top: "fc7_mbox_conf" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 12 # 126 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "fc7_mbox_conf_perm" type: "Permute" bottom: "fc7_mbox_conf" top: "fc7_mbox_conf_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "fc7_mbox_conf_flat" type: "Flatten" bottom: "fc7_mbox_conf_perm" top: "fc7_mbox_conf_flat" flatten_param { axis: 1 } } layer { name: "fc7_mbox_priorbox" type: "PriorBox" bottom: "fc7" bottom: "data" top: "fc7_mbox_priorbox" prior_box_param { min_size: 60.0 max_size: 111.0 aspect_ratio: 2 aspect_ratio: 3 flip: true clip: false variance: 0.1 variance: 0.1 variance: 0.2 variance: 0.2 step: 16 offset: 0.5 } } layer { name: "conv6_2_mbox_loc" type: "Convolution" bottom: "conv6_2_h" top: "conv6_2_mbox_loc" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 24 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv6_2_mbox_loc_perm" type: "Permute" bottom: "conv6_2_mbox_loc" top: "conv6_2_mbox_loc_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "conv6_2_mbox_loc_flat" type: "Flatten" bottom: "conv6_2_mbox_loc_perm" top: "conv6_2_mbox_loc_flat" flatten_param { axis: 1 } } layer { name: "conv6_2_mbox_conf" type: "Convolution" bottom: "conv6_2_h" top: "conv6_2_mbox_conf" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 12 # 126 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv6_2_mbox_conf_perm" type: "Permute" bottom: "conv6_2_mbox_conf" top: "conv6_2_mbox_conf_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "conv6_2_mbox_conf_flat" type: "Flatten" bottom: "conv6_2_mbox_conf_perm" top: "conv6_2_mbox_conf_flat" flatten_param { axis: 1 } } layer { name: "conv6_2_mbox_priorbox" type: "PriorBox" bottom: "conv6_2_h" bottom: "data" top: "conv6_2_mbox_priorbox" prior_box_param { min_size: 111.0 max_size: 162.0 aspect_ratio: 2 aspect_ratio: 3 flip: true clip: false variance: 0.1 variance: 0.1 variance: 0.2 variance: 0.2 step: 32 offset: 0.5 } } layer { name: "conv7_2_mbox_loc" type: "Convolution" bottom: "conv7_2_h" top: "conv7_2_mbox_loc" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 24 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv7_2_mbox_loc_perm" type: "Permute" bottom: "conv7_2_mbox_loc" top: "conv7_2_mbox_loc_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "conv7_2_mbox_loc_flat" type: "Flatten" bottom: "conv7_2_mbox_loc_perm" top: "conv7_2_mbox_loc_flat" flatten_param { axis: 1 } } layer { name: "conv7_2_mbox_conf" type: "Convolution" bottom: "conv7_2_h" top: "conv7_2_mbox_conf" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 12 # 126 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv7_2_mbox_conf_perm" type: "Permute" bottom: "conv7_2_mbox_conf" top: "conv7_2_mbox_conf_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "conv7_2_mbox_conf_flat" type: "Flatten" bottom: "conv7_2_mbox_conf_perm" top: "conv7_2_mbox_conf_flat" flatten_param { axis: 1 } } layer { name: "conv7_2_mbox_priorbox" type: "PriorBox" bottom: "conv7_2_h" bottom: "data" top: "conv7_2_mbox_priorbox" prior_box_param { min_size: 162.0 max_size: 213.0 aspect_ratio: 2 aspect_ratio: 3 flip: true clip: false variance: 0.1 variance: 0.1 variance: 0.2 variance: 0.2 step: 64 offset: 0.5 } } layer { name: "conv8_2_mbox_loc" type: "Convolution" bottom: "conv8_2_h" top: "conv8_2_mbox_loc" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 16 pad: 0 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv8_2_mbox_loc_perm" type: "Permute" bottom: "conv8_2_mbox_loc" top: "conv8_2_mbox_loc_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "conv8_2_mbox_loc_flat" type: "Flatten" bottom: "conv8_2_mbox_loc_perm" top: "conv8_2_mbox_loc_flat" flatten_param { axis: 1 } } layer { name: "conv8_2_mbox_conf" type: "Convolution" bottom: "conv8_2_h" top: "conv8_2_mbox_conf" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 8 # 84 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv8_2_mbox_conf_perm" type: "Permute" bottom: "conv8_2_mbox_conf" top: "conv8_2_mbox_conf_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "conv8_2_mbox_conf_flat" type: "Flatten" bottom: "conv8_2_mbox_conf_perm" top: "conv8_2_mbox_conf_flat" flatten_param { axis: 1 } } layer { name: "conv8_2_mbox_priorbox" type: "PriorBox" bottom: "conv8_2_h" bottom: "data" top: "conv8_2_mbox_priorbox" prior_box_param { min_size: 213.0 max_size: 264.0 aspect_ratio: 2 flip: true clip: false variance: 0.1 variance: 0.1 variance: 0.2 variance: 0.2 step: 100 offset: 0.5 } } layer { name: "conv9_2_mbox_loc" type: "Convolution" bottom: "conv9_2_h" top: "conv9_2_mbox_loc" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 16 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv9_2_mbox_loc_perm" type: "Permute" bottom: "conv9_2_mbox_loc" top: "conv9_2_mbox_loc_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "conv9_2_mbox_loc_flat" type: "Flatten" bottom: "conv9_2_mbox_loc_perm" top: "conv9_2_mbox_loc_flat" flatten_param { axis: 1 } } layer { name: "conv9_2_mbox_conf" type: "Convolution" bottom: "conv9_2_h" top: "conv9_2_mbox_conf" param { lr_mult: 1 decay_mult: 1 } param { lr_mult: 2 decay_mult: 0 } convolution_param { num_output: 8 # 84 pad: 1 kernel_size: 3 stride: 1 weight_filler { type: "xavier" } bias_filler { type: "constant" value: 0 } } } layer { name: "conv9_2_mbox_conf_perm" type: "Permute" bottom: "conv9_2_mbox_conf" top: "conv9_2_mbox_conf_perm" permute_param { order: 0 order: 2 order: 3 order: 1 } } layer { name: "conv9_2_mbox_conf_flat" type: "Flatten" bottom: "conv9_2_mbox_conf_perm" top: "conv9_2_mbox_conf_flat" flatten_param { axis: 1 } } layer { name: "conv9_2_mbox_priorbox" type: "PriorBox" bottom: "conv9_2_h" bottom: "data" top: "conv9_2_mbox_priorbox" prior_box_param { min_size: 264.0 max_size: 315.0 aspect_ratio: 2 flip: true clip: false variance: 0.1 variance: 0.1 variance: 0.2 variance: 0.2 step: 300 offset: 0.5 } } layer { name: "mbox_loc" type: "Concat" bottom: "conv4_3_norm_mbox_loc_flat" bottom: "fc7_mbox_loc_flat" bottom: "conv6_2_mbox_loc_flat" bottom: "conv7_2_mbox_loc_flat" bottom: "conv8_2_mbox_loc_flat" bottom: "conv9_2_mbox_loc_flat" top: "mbox_loc" concat_param { axis: 1 } } layer { name: "mbox_conf" type: "Concat" bottom: "conv4_3_norm_mbox_conf_flat" bottom: "fc7_mbox_conf_flat" bottom: "conv6_2_mbox_conf_flat" bottom: "conv7_2_mbox_conf_flat" bottom: "conv8_2_mbox_conf_flat" bottom: "conv9_2_mbox_conf_flat" top: "mbox_conf" concat_param { axis: 1 } } layer { name: "mbox_priorbox" type: "Concat" bottom: "conv4_3_norm_mbox_priorbox" bottom: "fc7_mbox_priorbox" bottom: "conv6_2_mbox_priorbox" bottom: "conv7_2_mbox_priorbox" bottom: "conv8_2_mbox_priorbox" bottom: "conv9_2_mbox_priorbox" top: "mbox_priorbox" concat_param { axis: 2 } } layer { name: "mbox_loss" type: "MultiBoxLoss" bottom: "mbox_loc" bottom: "mbox_conf" bottom: "mbox_priorbox" bottom: "label" top: "mbox_loss" include { phase: TRAIN } propagate_down: true propagate_down: true propagate_down: false propagate_down: false loss_param { normalization: VALID } multibox_loss_param { loc_loss_type: SMOOTH_L1 conf_loss_type: SOFTMAX loc_weight: 1.0 num_classes: 2 # 21 share_location: true match_type: PER_PREDICTION overlap_threshold: 0.5 use_prior_for_matching: true background_label_id: 0 use_difficult_gt: true neg_pos_ratio: 3.0 neg_overlap: 0.5 code_type: CENTER_SIZE ignore_cross_boundary_bbox: false mining_type: MAX_NEGATIVE } }