@@ -68,12 +68,13 @@ def grounding_dino(
68
68
box_threshold (float, optional): The threshold for the box detection. Defaults
69
69
to 0.20.
70
70
iou_threshold (float, optional): The threshold for the Intersection over Union
71
- (IoU). Defaults to 0.75 .
71
+ (IoU). Defaults to 0.20.
72
72
73
73
Returns:
74
74
List[Dict[str, Any]]: A list of dictionaries containing the score, label, and
75
75
bounding box of the detected objects with normalized coordinates
76
- (x1, y1, x2, y2).
76
+ (xmin, ymin, xmax, ymax), where (xmin, ymin) is the top-left corner and
77
+ (xmax, ymax) is the bottom-right corner of the bounding box.
77
78
78
79
Example
79
80
-------
@@ -120,12 +121,15 @@ def grounding_sam(
120
121
box_threshold (float, optional): The threshold for the box detection. Defaults
121
122
to 0.20.
122
123
iou_threshold (float, optional): The threshold for the Intersection over Union
123
- (IoU). Defaults to 0.75 .
124
+ (IoU). Defaults to 0.20.
124
125
125
126
Returns:
126
127
List[Dict[str, Any]]: A list of dictionaries containing the score, label,
127
128
bounding box, and mask of the detected objects with normalized coordinates
128
- (x1, y1, x2, y2).
129
+ (xmin, ymin, xmax, ymax), where (xmin, ymin) is the top-left corner and
130
+ (xmax, ymax) is the bottom-right corner of the bounding box.
131
+ The mask is a binary 2D numpy array where 1 indicates the object and 0 indicates
132
+ the background.
129
133
130
134
Example
131
135
-------
0 commit comments