You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
76 lines
2.7 KiB
76 lines
2.7 KiB
# Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
|
|
class TextDetectionMixin:
|
|
def __init__(
|
|
self,
|
|
*,
|
|
limit_side_len=None,
|
|
limit_type=None,
|
|
thresh=None,
|
|
box_thresh=None,
|
|
unclip_ratio=None,
|
|
input_shape=None,
|
|
**kwargs,
|
|
):
|
|
self._extra_init_args = {
|
|
"limit_side_len": limit_side_len,
|
|
"limit_type": limit_type,
|
|
"thresh": thresh,
|
|
"box_thresh": box_thresh,
|
|
"unclip_ratio": unclip_ratio,
|
|
"input_shape": input_shape,
|
|
}
|
|
super().__init__(**kwargs)
|
|
|
|
def _get_extra_paddlex_predictor_init_args(self):
|
|
return self._extra_init_args
|
|
|
|
|
|
class TextDetectionSubcommandExecutorMixin:
|
|
def _add_text_detection_args(self, subparser):
|
|
subparser.add_argument(
|
|
"--limit_side_len",
|
|
type=int,
|
|
help="This sets a limit on the side length of the input image for the model.",
|
|
)
|
|
subparser.add_argument(
|
|
"--limit_type",
|
|
type=str,
|
|
help="This determines how the side length limit is applied to the input image before feeding it into the model.",
|
|
)
|
|
subparser.add_argument(
|
|
"--thresh",
|
|
type=float,
|
|
help="Detection pixel threshold for the model. Pixels with scores greater than this threshold in the output probability map are considered text pixels.",
|
|
)
|
|
subparser.add_argument(
|
|
"--box_thresh",
|
|
type=float,
|
|
help="Detection box threshold for the model. A detection result is considered a text region if the average score of all pixels within the border of the result is greater than this threshold.",
|
|
)
|
|
subparser.add_argument(
|
|
"--unclip_ratio",
|
|
type=float,
|
|
help="Expansion coefficient, which expands the text region using this method. The larger the value, the larger the expansion area.",
|
|
)
|
|
subparser.add_argument(
|
|
"--input_shape",
|
|
nargs=3,
|
|
type=int,
|
|
metavar=("C", "H", "W"),
|
|
help="Input shape of the model.",
|
|
)
|