Skip to content

Commit 1ed56da

Browse files
committed
add args for pp-chatocr visual_predict (#3624)
1 parent 58417d8 commit 1ed56da

File tree

4 files changed

+58
-2
lines changed

4 files changed

+58
-2
lines changed

paddlex/inference/pipelines/layout_parsing/pipeline.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -378,7 +378,7 @@ def predict(
378378
use_formula_recognition: Optional[bool] = None,
379379
layout_threshold: Optional[Union[float, dict]] = None,
380380
layout_nms: Optional[bool] = None,
381-
layout_unclip_ratio: Optional[Union[float, Tuple[float, float]]] = None,
381+
layout_unclip_ratio: Optional[Union[float, Tuple[float, float], dict]] = None,
382382
layout_merge_bboxes_mode: Optional[str] = None,
383383
text_det_limit_side_len: Optional[int] = None,
384384
text_det_limit_type: Optional[str] = None,

paddlex/inference/pipelines/layout_parsing/pipeline_v2.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -414,7 +414,7 @@ def predict(
414414
use_formula_recognition: Union[bool, None] = None,
415415
layout_threshold: Optional[Union[float, dict]] = None,
416416
layout_nms: Optional[bool] = None,
417-
layout_unclip_ratio: Optional[Union[float, Tuple[float, float]]] = None,
417+
layout_unclip_ratio: Optional[Union[float, Tuple[float, float], dict]] = None,
418418
layout_merge_bboxes_mode: Optional[str] = None,
419419
text_det_limit_side_len: Union[int, None] = None,
420420
text_det_limit_type: Union[str, None] = None,

paddlex/inference/pipelines/pp_chatocr/pipeline_v3.py

Lines changed: 28 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -198,6 +198,10 @@ def visual_predict(
198198
use_general_ocr: Optional[bool] = None,
199199
use_seal_recognition: Optional[bool] = None,
200200
use_table_recognition: Optional[bool] = None,
201+
layout_threshold: Optional[Union[float, dict]] = None,
202+
layout_nms: Optional[bool] = None,
203+
layout_unclip_ratio: Optional[Union[float, Tuple[float, float], dict]] = None,
204+
layout_merge_bboxes_mode: Optional[str] = None,
201205
text_det_limit_side_len: Optional[int] = None,
202206
text_det_limit_type: Optional[str] = None,
203207
text_det_thresh: Optional[float] = None,
@@ -225,6 +229,26 @@ def visual_predict(
225229
use_general_ocr (bool): Flag to use general OCR.
226230
use_seal_recognition (bool): Flag to use seal recognition.
227231
use_table_recognition (bool): Flag to use table recognition.
232+
layout_threshold (Optional[Union[float, dict]]): The threshold value to filter out low-confidence predictions. Defaults to None.
233+
layout_nms (Optional[bool]): Whether to use layout-aware NMS. Defaults to None.
234+
layout_unclip_ratio (Optional[Union[float, Tuple[float, float], dict]], optional): The ratio of unclipping the bounding box.
235+
Defaults to None.
236+
If it's a single number, then it is used for both width and height.
237+
If it's a tuple of two numbers, then they are used separately for width and height respectively.
238+
If it's None, then no unclipping will be performed.
239+
layout_merge_bboxes_mode (Optional[str], optional): The mode for merging bounding boxes. Defaults to None.
240+
text_det_limit_side_len (Optional[int]): Maximum side length for text detection.
241+
text_det_limit_type (Optional[str]): Type of limit to apply for text detection.
242+
text_det_thresh (Optional[float]): Threshold for text detection.
243+
text_det_box_thresh (Optional[float]): Threshold for text detection boxes.
244+
text_det_unclip_ratio (Optional[float]): Ratio for unclipping text detection boxes.
245+
text_rec_score_thresh (Optional[float]): Score threshold for text recognition.
246+
seal_det_limit_side_len (Optional[int]): Maximum side length for seal detection.
247+
seal_det_limit_type (Optional[str]): Type of limit to apply for seal detection.
248+
seal_det_thresh (Optional[float]): Threshold for seal detection.
249+
seal_det_box_thresh (Optional[float]): Threshold for seal detection boxes.
250+
seal_det_unclip_ratio (Optional[float]): Ratio for unclipping seal detection boxes.
251+
seal_rec_score_thresh (Optional[float]): Score threshold for seal recognition.
228252
**kwargs: Additional keyword arguments.
229253
230254
Returns:
@@ -248,6 +272,10 @@ def visual_predict(
248272
use_general_ocr=use_general_ocr,
249273
use_seal_recognition=use_seal_recognition,
250274
use_table_recognition=use_table_recognition,
275+
layout_threshold=layout_threshold,
276+
layout_nms=layout_nms,
277+
layout_unclip_ratio=layout_unclip_ratio,
278+
layout_merge_bboxes_mode=layout_merge_bboxes_mode,
251279
text_det_limit_side_len=text_det_limit_side_len,
252280
text_det_limit_type=text_det_limit_type,
253281
text_det_thresh=text_det_thresh,

paddlex/inference/pipelines/pp_chatocr/pipeline_v4.py

Lines changed: 28 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -235,6 +235,10 @@ def visual_predict(
235235
use_general_ocr: Optional[bool] = None,
236236
use_seal_recognition: Optional[bool] = None,
237237
use_table_recognition: Optional[bool] = None,
238+
layout_threshold: Optional[Union[float, dict]] = None,
239+
layout_nms: Optional[bool] = None,
240+
layout_unclip_ratio: Optional[Union[float, Tuple[float, float], dict]] = None,
241+
layout_merge_bboxes_mode: Optional[str] = None,
238242
text_det_limit_side_len: Optional[int] = None,
239243
text_det_limit_type: Optional[str] = None,
240244
text_det_thresh: Optional[float] = None,
@@ -262,6 +266,26 @@ def visual_predict(
262266
use_general_ocr (bool): Flag to use general OCR.
263267
use_seal_recognition (bool): Flag to use seal recognition.
264268
use_table_recognition (bool): Flag to use table recognition.
269+
layout_threshold (Optional[Union[float, dict]]): The threshold value to filter out low-confidence predictions. Defaults to None.
270+
layout_nms (Optional[bool]): Whether to use layout-aware NMS. Defaults to None.
271+
layout_unclip_ratio (Optional[Union[float, Tuple[float, float], dict]], optional): The ratio of unclipping the bounding box.
272+
Defaults to None.
273+
If it's a single number, then it is used for both width and height.
274+
If it's a tuple of two numbers, then they are used separately for width and height respectively.
275+
If it's None, then no unclipping will be performed.
276+
layout_merge_bboxes_mode (Optional[str], optional): The mode for merging bounding boxes. Defaults to None.
277+
text_det_limit_side_len (Optional[int]): Maximum side length for text detection.
278+
text_det_limit_type (Optional[str]): Type of limit to apply for text detection.
279+
text_det_thresh (Optional[float]): Threshold for text detection.
280+
text_det_box_thresh (Optional[float]): Threshold for text detection boxes.
281+
text_det_unclip_ratio (Optional[float]): Ratio for unclipping text detection boxes.
282+
text_rec_score_thresh (Optional[float]): Score threshold for text recognition.
283+
seal_det_limit_side_len (Optional[int]): Maximum side length for seal detection.
284+
seal_det_limit_type (Optional[str]): Type of limit to apply for seal detection.
285+
seal_det_thresh (Optional[float]): Threshold for seal detection.
286+
seal_det_box_thresh (Optional[float]): Threshold for seal detection boxes.
287+
seal_det_unclip_ratio (Optional[float]): Ratio for unclipping seal detection boxes.
288+
seal_rec_score_thresh (Optional[float]): Score threshold for seal recognition.
265289
**kwargs: Additional keyword arguments.
266290
267291
Returns:
@@ -284,6 +308,10 @@ def visual_predict(
284308
use_general_ocr=use_general_ocr,
285309
use_seal_recognition=use_seal_recognition,
286310
use_table_recognition=use_table_recognition,
311+
layout_threshold=layout_threshold,
312+
layout_nms=layout_nms,
313+
layout_unclip_ratio=layout_unclip_ratio,
314+
layout_merge_bboxes_mode=layout_merge_bboxes_mode,
287315
text_det_limit_side_len=text_det_limit_side_len,
288316
text_det_limit_type=text_det_limit_type,
289317
text_det_thresh=text_det_thresh,

0 commit comments

Comments
 (0)