@@ -198,6 +198,10 @@ def visual_predict(
198
198
use_general_ocr : Optional [bool ] = None ,
199
199
use_seal_recognition : Optional [bool ] = None ,
200
200
use_table_recognition : Optional [bool ] = None ,
201
+ layout_threshold : Optional [Union [float , dict ]] = None ,
202
+ layout_nms : Optional [bool ] = None ,
203
+ layout_unclip_ratio : Optional [Union [float , Tuple [float , float ], dict ]] = None ,
204
+ layout_merge_bboxes_mode : Optional [str ] = None ,
201
205
text_det_limit_side_len : Optional [int ] = None ,
202
206
text_det_limit_type : Optional [str ] = None ,
203
207
text_det_thresh : Optional [float ] = None ,
@@ -225,6 +229,26 @@ def visual_predict(
225
229
use_general_ocr (bool): Flag to use general OCR.
226
230
use_seal_recognition (bool): Flag to use seal recognition.
227
231
use_table_recognition (bool): Flag to use table recognition.
232
+ layout_threshold (Optional[Union[float, dict]]): The threshold value to filter out low-confidence predictions. Default is None.
233
+ layout_nms (Optional[bool], optional): Whether to use layout-aware NMS. Defaults to None.
234
+ layout_unclip_ratio (Optional[Union[float, Tuple[float, float], dict]], optional): The ratio of unclipping the bounding box.
235
+ Defaults to None.
236
+ If it's a single number, then it is used for both width and height.
237
+ If it's a tuple of two numbers, then they are used separately for width and height respectively.
238
+ If it's None, then no unclipping will be performed.
239
+ layout_merge_bboxes_mode (Optional[str], optional): The mode for merging bounding boxes. Defaults to None.
240
+ text_det_limit_side_len (Optional[int]): Maximum side length for text detection.
241
+ text_det_limit_type (Optional[str]): Type of limit to apply for text detection.
242
+ text_det_thresh (Optional[float]): Threshold for text detection.
243
+ text_det_box_thresh (Optional[float]): Threshold for text detection boxes.
244
+ text_det_unclip_ratio (Optional[float]): Ratio for unclipping text detection boxes.
245
+ text_rec_score_thresh (Optional[float]): Score threshold for text recognition.
246
+ seal_det_limit_side_len (Optional[int]): Maximum side length for seal detection.
247
+ seal_det_limit_type (Optional[str]): Type of limit to apply for seal detection.
248
+ seal_det_thresh (Optional[float]): Threshold for seal detection.
249
+ seal_det_box_thresh (Optional[float]): Threshold for seal detection boxes.
250
+ seal_det_unclip_ratio (Optional[float]): Ratio for unclipping seal detection boxes.
251
+ seal_rec_score_thresh (Optional[float]): Score threshold for seal recognition.
228
252
**kwargs: Additional keyword arguments.
229
253
230
254
Returns:
@@ -248,6 +272,10 @@ def visual_predict(
248
272
use_general_ocr = use_general_ocr ,
249
273
use_seal_recognition = use_seal_recognition ,
250
274
use_table_recognition = use_table_recognition ,
275
+ layout_threshold = layout_threshold ,
276
+ layout_nms = layout_nms ,
277
+ layout_unclip_ratio = layout_unclip_ratio ,
278
+ layout_merge_bboxes_mode = layout_merge_bboxes_mode ,
251
279
text_det_limit_side_len = text_det_limit_side_len ,
252
280
text_det_limit_type = text_det_limit_type ,
253
281
text_det_thresh = text_det_thresh ,
0 commit comments