98 lines
		
	
	
		
			3.4 KiB
		
	
	
	
		
			Protocol Buffer
		
	
	
	
	
	
			
		
		
	
	
			98 lines
		
	
	
		
			3.4 KiB
		
	
	
	
		
			Protocol Buffer
		
	
	
	
	
	
// Copyright 2019 The MediaPipe Authors.
 | 
						|
//
 | 
						|
// Licensed under the Apache License, Version 2.0 (the "License");
 | 
						|
// you may not use this file except in compliance with the License.
 | 
						|
// You may obtain a copy of the License at
 | 
						|
//
 | 
						|
//      http://www.apache.org/licenses/LICENSE-2.0
 | 
						|
//
 | 
						|
// Unless required by applicable law or agreed to in writing, software
 | 
						|
// distributed under the License is distributed on an "AS IS" BASIS,
 | 
						|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | 
						|
// See the License for the specific language governing permissions and
 | 
						|
// limitations under the License.
 | 
						|
 | 
						|
syntax = "proto2";
 | 
						|
 | 
						|
package mediapipe;
 | 
						|
 | 
						|
import "mediapipe/util/tracking/box_tracker.proto";
 | 
						|
import "mediapipe/util/tracking/region_flow.proto";
 | 
						|
 | 
						|
option java_package = "com.google.mediapipe.tracking";
 | 
						|
option java_outer_classname = "BoxDetectorProto";
 | 
						|
 | 
						|
message BoxDetectorOptions {
 | 
						|
  // Available types of detector's index and search structure.
 | 
						|
  enum IndexType {
 | 
						|
    INDEX_UNSPECIFIED = 0;
 | 
						|
    // BFMatcher from OpenCV
 | 
						|
    OPENCV_BF = 1;
 | 
						|
  }
 | 
						|
 | 
						|
  optional IndexType index_type = 1 [default = OPENCV_BF];
 | 
						|
 | 
						|
  // Decide whether we force detector run every N frame.
 | 
						|
  // 0 means detection will never be called.
 | 
						|
  // 1 means detect every frame. 2 means detect every other frame. etc..
 | 
						|
  // Currently only applied to image query mode.
 | 
						|
  optional int32 detect_every_n_frame = 2 [default = 0];
 | 
						|
 | 
						|
  // Enable box detection when tracked boxes is out of FOV. Detection will be
 | 
						|
  // ceased after the detector successfully re-acquire the box.
 | 
						|
  optional bool detect_out_of_fov = 4 [default = false];
 | 
						|
 | 
						|
  // Options only for detection from image queries.
 | 
						|
  message ImageQuerySettings {
 | 
						|
    // Resize the input image's longer edge to this size. Skip resizing if the
 | 
						|
    // input size is already smaller than this size.
 | 
						|
    optional int32 pyramid_bottom_size = 1 [default = 640];
 | 
						|
 | 
						|
    // Scale factor between adjacent pyramid levels.
 | 
						|
    optional float pyramid_scale_factor = 2 [default = 1.2];
 | 
						|
 | 
						|
    // Maximum number of pyramid levels.
 | 
						|
    optional int32 max_pyramid_levels = 3 [default = 4];
 | 
						|
 | 
						|
    // Max number of features the detector uses.
 | 
						|
    optional int32 max_features = 4 [default = 500];
 | 
						|
  }
 | 
						|
 | 
						|
  // Options for detection function with image query.
 | 
						|
  optional ImageQuerySettings image_query_settings = 3;
 | 
						|
 | 
						|
  // Dimensions (number of elements) for feature descriptor.
 | 
						|
  optional int32 descriptor_dims = 5 [default = 40];
 | 
						|
 | 
						|
  // Minimum number of correspondence to go through RANSAC.
 | 
						|
  optional int32 min_num_correspondence = 6 [default = 5];
 | 
						|
 | 
						|
  // Reprojection threshold for RANSAC to find inliers.
 | 
						|
  optional float ransac_reprojection_threshold = 7 [default = 0.005];
 | 
						|
 | 
						|
  // Max distance to match 2 NIMBY features.
 | 
						|
  optional float max_match_distance = 8 [default = 0.9];
 | 
						|
 | 
						|
  // Max persepective change factor.
 | 
						|
  optional float max_perspective_factor = 9 [default = 0.1];
 | 
						|
}
 | 
						|
 | 
						|
// Proto to hold BoxDetector's internal search index.
 | 
						|
message BoxDetectorIndex {
 | 
						|
  // Message to hold keypoints and descriptors for each box.
 | 
						|
  message BoxEntry {
 | 
						|
    // Message to hold keypoints and descriptors for each appearance. One box
 | 
						|
    // could have multiple appearances to account for shape and perspective
 | 
						|
    // change, etc..
 | 
						|
    message FrameEntry {
 | 
						|
      optional TimedBoxProto box = 1;
 | 
						|
      repeated float keypoints = 2;
 | 
						|
      repeated BinaryFeatureDescriptor descriptors = 3;
 | 
						|
    }
 | 
						|
 | 
						|
    repeated FrameEntry frame_entry = 1;
 | 
						|
  }
 | 
						|
 | 
						|
  repeated BoxEntry box_entry = 1;
 | 
						|
}
 |