Browse Source

[Doc] Format docs (#9)

Lin Manhui 2 years ago
parent
commit
64c9697a4d
56 changed files with 1268 additions and 972 deletions
  1. .pre-commit-config.yaml (+4 -4)
  2. paddlers/datasets/__init__.py (+2 -2)
  3. paddlers/datasets/cd_dataset.py (+25 -18)
  4. paddlers/datasets/clas_dataset.py (+13 -11)
  5. paddlers/datasets/coco.py (+35 -30)
  6. paddlers/datasets/seg_dataset.py (+13 -11)
  7. paddlers/datasets/voc.py (+37 -32)
  8. paddlers/deploy/predictor.py (+34 -30)
  9. paddlers/rs_models/cd/backbones/resnet.py (+20 -9)
  10. paddlers/rs_models/cd/bit.py (+9 -9)
  11. paddlers/rs_models/cd/cdnet.py (+15 -25)
  12. paddlers/rs_models/cd/changestar.py (+11 -7)
  13. paddlers/rs_models/cd/dsamnet.py (+10 -7)
  14. paddlers/rs_models/cd/dsifn.py (+6 -5)
  15. paddlers/rs_models/cd/fc_ef.py (+7 -5)
  16. paddlers/rs_models/cd/fc_siam_conc.py (+7 -5)
  17. paddlers/rs_models/cd/fc_siam_diff.py (+7 -5)
  18. paddlers/rs_models/cd/layers/attention.py (+9 -6)
  19. paddlers/rs_models/cd/layers/blocks.py (+3 -1)
  20. paddlers/rs_models/cd/snunet.py (+8 -5)
  21. paddlers/rs_models/cd/stanet.py (+15 -9)
  22. paddlers/rs_models/res/rcan_model.py (+2 -1)
  23. paddlers/rs_models/seg/farseg.py (+5 -4)
  24. paddlers/rs_models/seg/layers/layers_lib.py (+5 -4)
  25. paddlers/tasks/base.py (+25 -20)
  26. paddlers/tasks/change_detector.py (+106 -83)
  27. paddlers/tasks/classifier.py (+84 -59)
  28. paddlers/tasks/load_model.py (+4 -4)
  29. paddlers/tasks/object_detector.py (+268 -168)
  30. paddlers/tasks/segmenter.py (+93 -68)
  31. paddlers/tasks/utils/det_metrics/coco_utils.py (+11 -18)
  32. paddlers/tasks/utils/visualize.py (+23 -20)
  33. paddlers/tools/yolo_cluster.py (+12 -11)
  34. paddlers/transforms/__init__.py (+10 -8)
  35. paddlers/transforms/batch_operators.py (+22 -17)
  36. paddlers/transforms/functions.py (+80 -74)
  37. paddlers/transforms/operators.py (+155 -112)
  38. paddlers/utils/download.py (+5 -6)
  39. paddlers/utils/env.py (+3 -1)
  40. paddlers/utils/stats.py (+2 -2)
  41. paddlers/utils/utils.py (+3 -3)
  42. tests/data/data_utils.py (+1 -1)
  43. tests/testing_utils.py (+13 -13)
  44. tools/coco_tools/json_AnnoSta.py (+3 -2)
  45. tools/coco_tools/json_Img2Json.py (+3 -2)
  46. tools/coco_tools/json_ImgSta.py (+2 -2)
  47. tools/coco_tools/json_InfoShow.py (+2 -2)
  48. tools/coco_tools/json_Merge.py (+2 -2)
  49. tools/coco_tools/json_Split.py (+2 -2)
  50. tools/match.py (+1 -1)
  51. tools/utils/raster.py (+21 -16)
  52. tutorials/train/object_detection/faster_rcnn.py (+2 -2)
  53. tutorials/train/object_detection/ppyolo.py (+2 -2)
  54. tutorials/train/object_detection/ppyolotiny.py (+2 -2)
  55. tutorials/train/object_detection/ppyolov2.py (+2 -2)
  56. tutorials/train/object_detection/yolov3.py (+2 -2)

+ 4 - 4
.pre-commit-config.yaml

@@ -1,11 +1,11 @@
 repos:
 -   repo: https://github.com/PaddlePaddle/mirrors-yapf.git
-    sha: 0d79c0c469bab64f7229c9aca2b1186ef47f0e37
+    rev: 0d79c0c469bab64f7229c9aca2b1186ef47f0e37
     hooks:
     -   id: yapf
         files: \.py$
 -   repo: https://github.com/pre-commit/pre-commit-hooks
-    sha: a11d9314b22d8f8c7556443875b731ef05965464
+    rev: a11d9314b22d8f8c7556443875b731ef05965464
     hooks:
     -   id: check-merge-conflict
     -   id: check-symlinks
@@ -16,7 +16,7 @@ repos:
     -   id: trailing-whitespace
         files: \.md$
 -   repo: https://github.com/Lucas-C/pre-commit-hooks
-    sha: v1.0.1
+    rev: v1.0.1
     hooks:
     -   id: forbid-crlf
         files: \.md$
@@ -25,4 +25,4 @@ repos:
     -   id: forbid-tabs
         files: \.md$
     -   id: remove-tabs
-        files: \.md$
+        files: \.md$

+ 2 - 2
paddlers/datasets/__init__.py

@@ -12,8 +12,8 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-from .voc import VOCDetection
-from .coco import COCODetection
+from .voc import VOCDetDataset
+from .coco import COCODetDataset
 from .seg_dataset import SegDataset
 from .cd_dataset import CDDataset
 from .clas_dataset import ClasDataset

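Since this commit renames the detection dataset classes, downstream imports change with it. A minimal sketch of the updated import style (the remaining dataset classes are untouched by the rename):

    # Renamed detection dataset classes, alongside the unchanged ones
    from paddlers.datasets import VOCDetDataset, COCODetDataset
    from paddlers.datasets import SegDataset, CDDataset, ClasDataset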
+ 25 - 18
paddlers/datasets/cd_dataset.py

@@ -22,28 +22,33 @@ from paddlers.utils import logging, get_encoding, norm_path, is_pic
 
 class CDDataset(BaseDataset):
     """
-    读取变化检测任务数据集,并对样本进行相应的处理(来自SegDataset,图像标签需要两个)。
+    Dataset for change detection tasks.
 
     Args:
-        data_dir (str): 数据集所在的目录路径。
-        file_list (str): 描述数据集图片文件和对应标注文件的文件路径(文本内每行路径为相对data_dir的相对路径)。当`with_seg_labels`为
-            False(默认设置)时,文件中每一行应依次包含第一时相影像、第二时相影像以及变化检测标签的路径;当`with_seg_labels`为True时,
-            文件中每一行应依次包含第一时相影像、第二时相影像、变化检测标签、第一时相建筑物标签以及第二时相建筑物标签的路径。
-        label_list (str): 描述数据集包含的类别信息文件路径。默认值为None。
-        transforms (paddlers.transforms.Compose): 数据集中每个样本的预处理/增强算子。
-        num_workers (int|str): 数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时,根据
-            系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8,则`num_workers`为8,否则为CPU核数的
-            一半。
-        shuffle (bool): 是否需要对数据集中样本打乱顺序。默认为False。
-        with_seg_labels (bool, optional): 数据集中是否包含两个时相的语义分割标签。默认为False。
-        binarize_labels (bool, optional): 是否对数据集中的标签进行二值化操作。默认为False。
+        data_dir (str): Root directory of the dataset.
+        file_list (str): Path of the file that contains relative paths of images and annotation files. When
+            `with_seg_labels` is False, each line in the file contains the paths of the bi-temporal images and
+            the change mask. When `with_seg_labels` is True, each line in the file contains the paths of the
+            bi-temporal images, the path of the change mask, and the paths of the segmentation masks in both
+            temporal phases.
+        transforms (paddlers.transforms.Compose): Data preprocessing and data augmentation operators to apply.
+        label_list (str, optional): Path of the file that contains the category names. Defaults to None.
+        num_workers (int|str, optional): Number of processes used for data loading. If `num_workers` is 'auto',
+            the number of workers will be automatically determined according to the number of CPU cores: if
+            there are more than 16 cores, 8 workers will be used. Otherwise, the number of workers will be half
+            the number of CPU cores. Defaults to 'auto'.
+        shuffle (bool, optional): Whether to shuffle the samples. Defaults to False.
+        with_seg_labels (bool, optional): Set `with_seg_labels` to True if the dataset provides segmentation
+            masks (e.g., building masks in each temporal phase). Defaults to False.
+        binarize_labels (bool, optional): Whether to binarize change masks and segmentation masks.
+            Defaults to False.
     """
 
     def __init__(self,
                  data_dir,
                  file_list,
+                 transforms,
                  label_list=None,
-                 transforms=None,
                  num_workers='auto',
                  shuffle=False,
                  with_seg_labels=False,
@@ -64,8 +69,7 @@ class CDDataset(BaseDataset):
             num_items = 3  # RGB1, RGB2, CD
         self.binarize_labels = binarize_labels
 
-        # TODO:非None时,让用户跳转数据集分析生成label_list
-        # 不要在此处分析label file
+        # TODO: If `label_list` is not None, let the user parse `label_list`.
         if label_list is not None:
             with open(label_list, encoding=get_encoding(label_list)) as f:
                 for line in f:
@@ -77,7 +81,7 @@ class CDDataset(BaseDataset):
                 items = line.strip().split(DELIMETER)
 
                 if len(items) != num_items:
-                    raise Exception(
+                    raise ValueError(
                         "Line[{}] in file_list[{}] has an incorrect number of file paths.".
                         format(line.strip(), file_list))
 
@@ -148,7 +152,10 @@
 
 
 class MaskType(IntEnum):
-    """Enumeration of the mask types used in the change detection task."""
+    """
+    Enumeration of the mask types used in the change detection task.
+    """
+
     CD = 0
     SEG_T1 = 1
     SEG_T2 = 2

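With `transforms` now a required positional argument placed before `label_list`, constructing a CDDataset looks like the following minimal sketch. The file paths are hypothetical, and the Resize/Normalize operators are assumed to be available in paddlers.transforms:

    import paddlers.transforms as T
    from paddlers.datasets import CDDataset

    # Hypothetical dataset layout; each line of train_list.txt holds
    # the bi-temporal image paths and the change mask path.
    train_transforms = T.Compose([T.Resize(target_size=256), T.Normalize()])
    train_data = CDDataset(
        data_dir='data/cd',
        file_list='data/cd/train_list.txt',
        transforms=train_transforms,   # now the third positional argument
        label_list=None,
        num_workers='auto',
        shuffle=True,
        with_seg_labels=False,
        binarize_labels=True)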
+ 13 - 11
paddlers/datasets/clas_dataset.py

@@ -19,24 +19,26 @@ from paddlers.utils import logging, get_encoding, norm_path, is_pic
 
 
 class ClasDataset(BaseDataset):
-    """读取图像分类任务数据集,并对样本进行相应的处理。
+    """
+    Dataset for scene classification tasks.
 
     Args:
-        data_dir (str): 数据集所在的目录路径。
-        file_list (str): 描述数据集图片文件和对应标注序号(文本内每行路径为相对data_dir的相对路)。
-        label_list (str): 描述数据集包含的类别信息文件路径,文件格式为(类别 说明)。默认值为None。
-        transforms (paddlers.transforms.Compose): 数据集中每个样本的预处理/增强算子。
-        num_workers (int|str): 数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时,根据
-            系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8,则`num_workers`为8,否则为CPU核数的
-            一半。
-        shuffle (bool): 是否需要对数据集中样本打乱顺序。默认为False。
+        data_dir (str): Root directory of the dataset.
+        file_list (str): Path of the file that contains relative paths of images and labels.
+        transforms (paddlers.transforms.Compose): Data preprocessing and data augmentation operators to apply.
+        label_list (str, optional): Path of the file that contains the category names. Defaults to None.
+        num_workers (int|str, optional): Number of processes used for data loading. If `num_workers` is 'auto',
+            the number of workers will be automatically determined according to the number of CPU cores: if
+            there are more than 16 cores, 8 workers will be used. Otherwise, the number of workers will be half
+            the number of CPU cores. Defaults to 'auto'.
+        shuffle (bool, optional): Whether to shuffle the samples. Defaults to False.
     """
 
     def __init__(self,
                  data_dir,
                  file_list,
+                 transforms,
                  label_list=None,
-                 transforms=None,
                  num_workers='auto',
                  shuffle=False):
         super(ClasDataset, self).__init__(data_dir, label_list, transforms,
@@ -57,7 +59,7 @@ class ClasDataset(BaseDataset):
             for line in f:
                 items = line.strip().split()
                 if len(items) > 2:
-                    raise Exception(
+                    raise ValueError(
                         "A space is defined as the delimiter to separate the image and label path, " \
                         "so the space cannot be in the image or label path, but the line[{}] of " \
                         " file_list[{}] has a space in the image or label path.".format(line, file_list))

+ 35 - 30
paddlers/datasets/coco.py

@@ -27,29 +27,32 @@ from paddlers.transforms import DecodeImg, MixupImage
 from paddlers.tools import YOLOAnchorCluster
 
 
-class COCODetection(BaseDataset):
-    """读取COCO格式的检测数据集,并对样本进行相应的处理。
+class COCODetDataset(BaseDataset):
+    """
+    Dataset with COCO annotations for detection tasks.
 
     Args:
-        data_dir (str): 数据集所在的目录路径。
-        image_dir (str): 描述数据集图片文件路径。
-        anno_path (str): COCO标注文件路径。
-        label_list (str): 描述数据集包含的类别信息文件路径。
-        transforms (paddlers.transforms.Compose): 数据集中每个样本的预处理/增强算子。
-        num_workers (int|str): 数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时,根据
-            系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8,则`num_workers`为8,否则为CPU核数的
-            一半。
-        shuffle (bool): 是否需要对数据集中样本打乱顺序。默认为False。
-        allow_empty (bool): 是否加载负样本。默认为False。
-        empty_ratio (float): 用于指定负样本占总样本数的比例。如果小于0或大于等于1,则保留全部的负样本。默认为1。
+        data_dir (str): Root directory of the dataset.
+        image_dir (str): Directory that contains the images.
+        anno_path (str): Path of the COCO annotation file.
+        transforms (paddlers.transforms.Compose): Data preprocessing and data augmentation operators to apply.
+        label_list (str): Path of the file that contains the category names.
+        num_workers (int|str, optional): Number of processes used for data loading. If `num_workers` is 'auto',
+            the number of workers will be automatically determined according to the number of CPU cores: if
+            there are more than 16 cores, 8 workers will be used. Otherwise, the number of workers will be half
+            the number of CPU cores. Defaults to 'auto'.
+        shuffle (bool, optional): Whether to shuffle the samples. Defaults to False.
+        allow_empty (bool, optional): Whether to add negative samples. Defaults to False.
+        empty_ratio (float, optional): Ratio of negative samples. If `empty_ratio` is smaller than 0 or not less
+            than 1, keep all generated negative samples. Defaults to 1.0.
     """
 
     def __init__(self,
                  data_dir,
                  image_dir,
                  anno_path,
+                 transforms,
                  label_list,
-                 transforms=None,
                  num_workers='auto',
                  shuffle=False,
                  allow_empty=False,
@@ -60,8 +63,8 @@ class COCODetection(BaseDataset):
         import matplotlib
         matplotlib.use('Agg')
         from pycocotools.coco import COCO
-        super(COCODetection, self).__init__(data_dir, label_list, transforms,
-                                            num_workers, shuffle)
+        super(COCODetDataset, self).__init__(data_dir, label_list, transforms,
+                                             num_workers, shuffle)
 
         self.data_fields = None
         self.num_max_boxes = 50
@@ -281,15 +284,16 @@ class COCODetection(BaseDataset):
             https://github.com/ultralytics/yolov5/blob/master/utils/autoanchor.py
 
         Args:
-            num_anchors (int): number of clusters
-            image_size (list or int): [h, w], being an int means image height and image width are the same.
-            cache (bool): whether using cache
-            cache_path (str or None, optional): cache directory path. If None, use `data_dir` of dataset.
-            iters (int, optional): iters of kmeans algorithm
-            gen_iters (int, optional): iters of genetic algorithm
-            threshold (float, optional): anchor scale threshold
-            verbose (bool, optional): whether print results
+            num_anchors (int): Number of clusters.
+            image_size (list[int]|int): [h, w] or an int value that corresponds to the shape [image_size, image_size].
+            cache (bool, optional): Whether to use cache. Defaults to True.
+            cache_path (str|None, optional): Path of cache directory. If None, use `dataset.data_dir`.
+                Defaults to None.
+            iters (int, optional): Iterations of k-means algorithm. Defaults to 300.
+            gen_iters (int, optional): Iterations of genetic algorithm. Defaults to 1000.
+            thresh (float, optional): Anchor scale threshold. Defaults to 0.25.
         """
+
         if cache_path is None:
             cache_path = self.data_dir
         cluster = YOLOAnchorCluster(
@@ -305,17 +309,18 @@ class COCODetection(BaseDataset):
         return anchors
 
     def add_negative_samples(self, image_dir, empty_ratio=1):
-        """将背景图片加入训练
+        """
+        Generate and add negative samples.
 
         Args:
-            image_dir (str):背景图片所在的文件夹目录。
-            empty_ratio (float or None): 用于指定负样本占总样本数的比例。如果为None,保留数据集初始化是设置的`empty_ratio`值,
-                否则更新原有`empty_ratio`值。如果小于0或大于等于1,则保留全部的负样本。默认为1。
-
+            image_dir (str): Directory that contains images.
+            empty_ratio (float|None, optional): Ratio of negative samples. If `empty_ratio` is smaller than
+                0 or not less than 1, keep all generated negative samples. Defaults to 1.0.
         """
+
         import cv2
         if not osp.isdir(image_dir):
-            raise Exception("{} is not a valid image directory.".format(
+            raise ValueError("{} is not a valid image directory.".format(
                 image_dir))
         if empty_ratio is not None:
             self.empty_ratio = empty_ratio

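The renamed COCODetDataset follows the same argument order, with `transforms` preceding `label_list`. A minimal construction sketch with hypothetical paths:

    import paddlers.transforms as T
    from paddlers.datasets import COCODetDataset

    train_data = COCODetDataset(
        data_dir='data/det',                   # hypothetical dataset layout
        image_dir='images',
        anno_path='annotations/train.json',
        transforms=T.Compose([T.Normalize()]),  # now precedes label_list
        label_list='data/det/labels.txt',
        shuffle=True,
        allow_empty=False)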
+ 13 - 11
paddlers/datasets/seg_dataset.py

@@ -20,24 +20,26 @@ from paddlers.utils import logging, get_encoding, norm_path, is_pic
 
 
 class SegDataset(BaseDataset):
-    """读取语义分割任务数据集,并对样本进行相应的处理。
+    """
+    Dataset for semantic segmentation tasks.
 
     Args:
-        data_dir (str): 数据集所在的目录路径。
-        file_list (str): 描述数据集图片文件和对应标注文件的文件路径(文本内每行路径为相对data_dir的相对路)。
-        label_list (str): 描述数据集包含的类别信息文件路径。默认值为None。
-        transforms (paddlers.transforms.Compose): 数据集中每个样本的预处理/增强算子。
-        num_workers (int|str): 数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时,根据
-            系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8,则`num_workers`为8,否则为CPU核数的
-            一半。
-        shuffle (bool): 是否需要对数据集中样本打乱顺序。默认为False。
+        data_dir (str): Root directory of the dataset.
+        file_list (str): Path of the file that contains relative paths of images and annotation files.
+        transforms (paddlers.transforms.Compose): Data preprocessing and data augmentation operators to apply.
+        label_list (str, optional): Path of the file that contains the category names. Defaults to None.
+        num_workers (int|str, optional): Number of processes used for data loading. If `num_workers` is 'auto',
+            the number of workers will be automatically determined according to the number of CPU cores: if
+            there are more than 16 cores, 8 workers will be used. Otherwise, the number of workers will be half
+            the number of CPU cores. Defaults to 'auto'.
+        shuffle (bool, optional): Whether to shuffle the samples. Defaults to False.
     """
 
     def __init__(self,
                  data_dir,
                  file_list,
+                 transforms,
                  label_list=None,
-                 transforms=None,
                  num_workers='auto',
                  shuffle=False):
         super(SegDataset, self).__init__(data_dir, label_list, transforms,
@@ -58,7 +60,7 @@ class SegDataset(BaseDataset):
             for line in f:
                 items = line.strip().split()
                 if len(items) > 2:
-                    raise Exception(
+                    raise ValueError(
                         "A space is defined as the delimiter to separate the image and label path, " \
                         "so the space cannot be in the image or label path, but the line[{}] of " \
                         " file_list[{}] has a space in the image or label path.".format(line, file_list))

+ 37 - 32
paddlers/datasets/voc.py

@@ -29,27 +29,30 @@ from paddlers.transforms import DecodeImg, MixupImage
 from paddlers.tools import YOLOAnchorCluster
 
 
-class VOCDetection(BaseDataset):
-    """读取PascalVOC格式的检测数据集,并对样本进行相应的处理。
+class VOCDetDataset(BaseDataset):
+    """
+    Dataset with PASCAL VOC annotations for detection tasks.
 
     Args:
-        data_dir (str): 数据集所在的目录路径。
-        file_list (str): 描述数据集图片文件和对应标注文件的文件路径(文本内每行路径为相对data_dir的相对路)。
-        label_list (str): 描述数据集包含的类别信息文件路径。
-        transforms (paddlers.transforms.Compose): 数据集中每个样本的预处理/增强算子。
-        num_workers (int|str): 数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时,根据
-            系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8,则`num_workers`为8,否则为CPU核数的
-            一半。
-        shuffle (bool): 是否需要对数据集中样本打乱顺序。默认为False。
-        allow_empty (bool): 是否加载负样本。默认为False。
-        empty_ratio (float): 用于指定负样本占总样本数的比例。如果小于0或大于等于1,则保留全部的负样本。默认为1。
+        data_dir (str): Root directory of the dataset.
+        file_list (str): Path of the file that contains relative paths of images and annotation files.
+        transforms (paddlers.transforms.Compose): Data preprocessing and data augmentation operators to apply.
+        label_list (str): Path of the file that contains the category names.
+        num_workers (int|str, optional): Number of processes used for data loading. If `num_workers` is 'auto',
+            the number of workers will be automatically determined according to the number of CPU cores: if
+            there are more than 16 cores, 8 workers will be used. Otherwise, the number of workers will be half
+            the number of CPU cores. Defaults to 'auto'.
+        shuffle (bool, optional): Whether to shuffle the samples. Defaults to False.
+        allow_empty (bool, optional): Whether to add negative samples. Defaults to False.
+        empty_ratio (float, optional): Ratio of negative samples. If `empty_ratio` is smaller than 0 or not less
+            than 1, keep all generated negative samples. Defaults to 1.0.
     """
 
     def __init__(self,
                  data_dir,
                  file_list,
+                 transforms,
                  label_list,
-                 transforms=None,
                  num_workers='auto',
                  shuffle=False,
                  allow_empty=False,
@@ -60,8 +63,8 @@ class VOCDetection(BaseDataset):
         import matplotlib
         matplotlib.use('Agg')
         from pycocotools.coco import COCO
-        super(VOCDetection, self).__init__(data_dir, label_list, transforms,
-                                           num_workers, shuffle)
+        super(VOCDetDataset, self).__init__(data_dir, label_list, transforms,
+                                            num_workers, shuffle)
 
         self.data_fields = None
         self.num_max_boxes = 50
@@ -109,9 +112,9 @@ class VOCDetection(BaseDataset):
                 if not line:
                     break
                 if len(line.strip().split()) > 2:
-                    raise Exception("A space is defined as the separator, "
-                                    "but it exists in image or label name {}."
-                                    .format(line))
+                    raise ValueError("A space is defined as the separator, "
+                                     "but it exists in image or label name {}."
+                                     .format(line))
                 img_file, xml_file = [
                     osp.join(data_dir, x) for x in line.strip().split()[:2]
                 ]
@@ -345,15 +348,16 @@ class VOCDetection(BaseDataset):
             https://github.com/ultralytics/yolov5/blob/master/utils/autoanchor.py
 
         Args:
-            num_anchors (int): number of clusters
-            image_size (list or int): [h, w], being an int means image height and image width are the same.
-            cache (bool): whether using cache
-            cache_path (str or None, optional): cache directory path. If None, use `data_dir` of dataset.
-            iters (int, optional): iters of kmeans algorithm
-            gen_iters (int, optional): iters of genetic algorithm
-            threshold (float, optional): anchor scale threshold
-            verbose (bool, optional): whether print results
+            num_anchors (int): Number of clusters.
+            image_size (list[int]|int): [h, w] or an int value that corresponds to the shape [image_size, image_size].
+            cache (bool, optional): Whether to use cache. Defaults to True.
+            cache_path (str|None, optional): Path of cache directory. If None, use `dataset.data_dir`.
+                Defaults to None.
+            iters (int, optional): Iterations of k-means algorithm. Defaults to 300.
+            gen_iters (int, optional): Iterations of genetic algorithm. Defaults to 1000.
+            thresh (float, optional): Anchor scale threshold. Defaults to 0.25.
         """
+
         if cache_path is None:
             cache_path = self.data_dir
         cluster = YOLOAnchorCluster(
@@ -369,17 +373,18 @@ class VOCDetection(BaseDataset):
         return anchors
 
     def add_negative_samples(self, image_dir, empty_ratio=1):
-        """将背景图片加入训练
+        """
+        Generate and add negative samples.
 
         Args:
-            image_dir (str):背景图片所在的文件夹目录。
-            empty_ratio (float or None): 用于指定负样本占总样本数的比例。如果为None,保留数据集初始化是设置的`empty_ratio`值,
-                否则更新原有`empty_ratio`值。如果小于0或大于等于1,则保留全部的负样本。默认为1。
-
+            image_dir (str): Directory that contains images.
+            empty_ratio (float|None, optional): Ratio of negative samples. If `empty_ratio` is smaller than
+                0 or not less than 1, keep all generated negative samples. Defaults to 1.0.
         """
+
         import cv2
         if not osp.isdir(image_dir):
-            raise Exception("{} is not a valid image directory.".format(
+            raise ValueError("{} is not a valid image directory.".format(
                 image_dir))
         if empty_ratio is not None:
             self.empty_ratio = empty_ratio

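Given the re-documented cluster_yolo_anchor signature above, a usage sketch on a VOC-format dataset (the paths are hypothetical, and the Normalize operator is assumed):

    import paddlers.transforms as T
    from paddlers.datasets import VOCDetDataset

    dataset = VOCDetDataset(
        data_dir='data/voc',
        file_list='data/voc/train_list.txt',
        transforms=T.Compose([T.Normalize()]),
        label_list='data/voc/labels.txt')
    # Cluster 9 anchors for 608x608 inputs; per the docstring, results
    # are cached under `dataset.data_dir` unless `cache_path` is given.
    anchors = dataset.cluster_yolo_anchor(num_anchors=9, image_size=608)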
+ 34 - 30
paddlers/deploy/predictor.py

@@ -39,20 +39,20 @@ class Predictor(object):
                  max_trt_batch_size=1,
                  trt_precision_mode='float32'):
         """
-        创建Paddle Predictor
-
         Args:
-            model_dir: 模型路径(必须是导出的部署或量化模型)。
-            use_gpu: 是否使用GPU,默认为False。
-            gpu_id: 使用GPU的ID,默认为0。
-            cpu_thread_num:使用cpu进行预测时的线程数,默认为1。
-            use_mkl: 是否使用mkldnn计算库,CPU情况下使用,默认为False。
-            mkl_thread_num: mkldnn计算线程数,默认为4。
-            use_trt: 是否使用TensorRT,默认为False。
-            use_glog: 是否启用glog日志, 默认为False。
-            memory_optimize: 是否启动内存优化,默认为True。
-            max_trt_batch_size: 在使用TensorRT时配置的最大batch size,默认为1。
-            trt_precision_mode:在使用TensorRT时采用的精度,可选值['float32', 'float16']。默认为'float32'。
+            model_dir (str): Path of the exported model.
+            use_gpu (bool, optional): Whether to use a GPU. Defaults to False.
+            gpu_id (int, optional): GPU ID. Defaults to 0.
+            cpu_thread_num (int, optional): Number of threads to use when making predictions using CPUs.
+                Defaults to 1.
+            use_mkl (bool, optional): Whether to use MKL-DNN. Defaults to False.
+            mkl_thread_num (int, optional): Number of MKL threads. Defaults to 4.
+            use_trt (bool, optional): Whether to use TensorRT. Defaults to False.
+            use_glog (bool, optional): Whether to enable glog logs. Defaults to False.
+            memory_optimize (bool, optional): Whether to enable memory optimization. Defaults to True.
+            max_trt_batch_size (int, optional): Maximum batch size when configured with TensorRT. Defaults to 1.
+            trt_precision_mode (str, optional): Precision to use when configured with TensorRT. Possible values
+                are {'float32', 'float16'}. Defaults to 'float32'.
         """
 
         self.model_dir = model_dir
@@ -209,10 +209,13 @@ class Predictor(object):
         return preds
 
     def raw_predict(self, inputs):
-        """ 接受预处理过后的数据进行预测
-            Args:
-                inputs(dict): 预处理过后的数据
+        """
+        Predict according to preprocessed inputs.
+
+        Args:
+            inputs (dict): Preprocessed inputs.
         """
+
         input_names = self.predictor.get_input_names()
         for name in input_names:
             input_tensor = self.predictor.get_input_handle(name)
@@ -253,21 +256,22 @@ class Predictor(object):
                 warmup_iters=0,
                 repeats=1):
         """
-            Do prediction.
-
-            Args:
-                img_file(list[str | tuple | np.ndarray] | str | tuple | np.ndarray): For scene classification, image restoration, 
-                    object detection and semantic segmentation tasks, `img_file` should be either the path of the image to predict
-                    , a decoded image (a np.ndarray, which should be consistent with what you get from passing image path to
-                    paddlers.transforms.decode_image()), or a list of image paths or decoded images. For change detection tasks,
-                    img_file should be a tuple of image paths, a tuple of decoded images, or a list of tuples.
-                topk(int, optional): Top-k values to reserve in a classification result. Defaults to 1.
-                transforms (paddlers.transforms.Compose | None, optional): Pipeline of data preprocessing. If None, load transforms
-                    from `model.yml`. Defaults to None.
-                warmup_iters (int, optional): Warm-up iterations before measuring the execution time. Defaults to 0.
-                repeats (int, optional): Number of repetitions to evaluate model inference and data processing speed. If greater than
-                    1, the reported time consumption is the average of all repeats. Defaults to 1.
+        Do prediction.
+
+        Args:
+            img_file (list[str|tuple|np.ndarray] | str | tuple | np.ndarray): For scene classification, image restoration,
+                object detection and semantic segmentation tasks, `img_file` should be either the path of the image to
+                predict, a decoded image (a np.ndarray, which should be consistent with what you get from passing the
+                image path to paddlers.transforms.decode_image()), or a list of image paths or decoded images. For
+                change detection tasks, `img_file` should be a tuple of image paths, a tuple of decoded images, or a
+                list of tuples.
+            topk (int, optional): Top-k values to reserve in a classification result. Defaults to 1.
+            transforms (paddlers.transforms.Compose|None, optional): Pipeline of data preprocessing. If None, load
+                transforms from `model.yml`. Defaults to None.
+            warmup_iters (int, optional): Warm-up iterations before measuring the execution time. Defaults to 0.
+            repeats (int, optional): Number of repetitions used to evaluate model inference and data processing speed.
+                If greater than 1, the reported time consumption is the average over all repeats. Defaults to 1.
         """
+
         if repeats < 1:
             logging.error("`repeats` must be greater than 1.", exit=True)
         if transforms is None and not hasattr(self._model, 'test_transforms'):

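A minimal deployment sketch matching the documented parameters; the exported model directory and the test image path are hypothetical:

    from paddlers.deploy import Predictor

    predictor = Predictor(
        'inference_model',        # hypothetical exported model directory
        use_gpu=True,
        gpu_id=0,
        max_trt_batch_size=1,
        trt_precision_mode='float32')
    # Warm up for 10 iterations, then average timing over 100 repeats.
    result = predictor.predict('test.jpg', warmup_iters=10, repeats=100)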
+ 20 - 9
paddlers/rs_models/cd/backbones/resnet.py

@@ -162,14 +162,17 @@ class BottleneckBlock(nn.Layer):
 
 
 class ResNet(nn.Layer):
-    """ResNet model from
-    `"Deep Residual Learning for Image Recognition" <https://arxiv.org/pdf/1512.03385.pdf>`_
+    """
+    ResNet model from "Deep Residual Learning for Image Recognition" 
+        (https://arxiv.org/pdf/1512.03385.pdf)
+    
     Args:
         Block (BasicBlock|BottleneckBlock): block module of model.
         depth (int): layers of resnet, default: 50.
-        num_classes (int): output dim of last fc layer. If num_classes <=0, last fc layer 
-                            will not be defined. Default: 1000.
+        num_classes (int): output dim of last fc layer. If num_classes <=0, last fc 
+            layer will not be defined. Default: 1000.
         with_pool (bool): use pool before the last fc layer or not. Default: True.
+    
     Examples:
         .. code-block:: python
             from paddle.vision.models import ResNet
@@ -283,7 +286,8 @@ def _resnet(arch, Block, depth, pretrained, **kwargs):
 
 
 def resnet18(pretrained=False, **kwargs):
-    """ResNet 18-layer model
+    """
+    ResNet 18-layer model
     
     Args:
         pretrained (bool): If True, returns a model pre-trained on ImageNet
@@ -299,7 +303,8 @@ def resnet18(pretrained=False, **kwargs):
 
 
 def resnet34(pretrained=False, **kwargs):
-    """ResNet 34-layer model
+    """
+    ResNet 34-layer model
     
     Args:
         pretrained (bool): If True, returns a model pre-trained on ImageNet
@@ -316,10 +321,12 @@ def resnet34(pretrained=False, **kwargs):
 
 
 def resnet50(pretrained=False, **kwargs):
-    """ResNet 50-layer model
+    """
+    ResNet 50-layer model
     
     Args:
         pretrained (bool): If True, returns a model pre-trained on ImageNet
+
     Examples:
         .. code-block:: python
             from paddle.vision.models import resnet50
@@ -332,10 +339,12 @@ def resnet50(pretrained=False, **kwargs):
 
 
 def resnet101(pretrained=False, **kwargs):
-    """ResNet 101-layer model
+    """
+    ResNet 101-layer model
     
     Args:
         pretrained (bool): If True, returns a model pre-trained on ImageNet
+
     Examples:
         .. code-block:: python
             from paddle.vision.models import resnet101
@@ -348,10 +357,12 @@ def resnet101(pretrained=False, **kwargs):
 
 
 def resnet152(pretrained=False, **kwargs):
-    """ResNet 152-layer model
+    """
+    ResNet 152-layer model
     
     Args:
         pretrained (bool): If True, returns a model pre-trained on ImageNet
+
     Examples:
         .. code-block:: python
             from paddle.vision.models import resnet152

+ 9 - 9
paddlers/rs_models/cd/bit.py

@@ -42,24 +42,24 @@ class BIT(nn.Layer):
     This implementation adopts pretrained encoders, as opposed to the original work where weights are randomly initialized.
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
         backbone (str, optional): The ResNet architecture that is used as the backbone. Currently, only 'resnet18' and 
             'resnet34' are supported. Default: 'resnet18'.
-        n_stages (int, optional): The number of ResNet stages used in the backbone, which should be a value in {3,4,5}. 
+        n_stages (int, optional): Number of ResNet stages used in the backbone, which should be a value in {3,4,5}. 
             Default: 4.
         use_tokenizer (bool, optional): Use a tokenizer or not. Default: True.
-        token_len (int, optional): The length of input tokens. Default: 4.
+        token_len (int, optional): Length of input tokens. Default: 4.
         pool_mode (str, optional): The pooling strategy to obtain input tokens when `use_tokenizer` is set to False. 'max'
             for global max pooling and 'avg' for global average pooling. Default: 'max'.
-        pool_size (int, optional): The height and width of the pooled feature maps when `use_tokenizer` is set to False. 
+        pool_size (int, optional): Height and width of the pooled feature maps when `use_tokenizer` is set to False. 
             Default: 2.
         enc_with_pos (bool, optional): Whether to add learned positional embedding to the input feature sequence of the 
             encoder. Default: True.
-        enc_depth (int, optional): The number of attention blocks used in the encoder. Default: 1
-        enc_head_dim (int, optional): The embedding dimension of each encoder head. Default: 64.
-        dec_depth (int, optional): The number of attention blocks used in the decoder. Default: 8.
-        dec_head_dim (int, optional): The embedding dimension of each decoder head. Default: 8.
+        enc_depth (int, optional): Number of attention blocks used in the encoder. Default: 1.
+        enc_head_dim (int, optional): Embedding dimension of each encoder head. Default: 64.
+        dec_depth (int, optional): Number of attention blocks used in the decoder. Default: 8.
+        dec_head_dim (int, optional): Embedding dimension of each decoder head. Default: 8.
 
     Raises:
         ValueError: When an unsupported backbone type is specified, or the number of backbone stages is not 3, 4, or 5.

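A construction sketch under the documented defaults. It assumes the package re-exports BIT from paddlers.rs_models.cd and that the model follows the two-input forward convention used by the other change detection models in this diff; all values are illustrative:

    import paddle
    from paddlers.rs_models.cd import BIT

    # 3-band bi-temporal inputs, binary change detection (illustrative values)
    model = BIT(in_channels=3, num_classes=2, backbone='resnet18', n_stages=4)
    t1 = paddle.randn((1, 3, 256, 256))
    t2 = paddle.randn((1, 3, 256, 256))
    pred = model(t1, t2)[0]   # first output: change logits (shape assumed [1, 2, 256, 256])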
+ 15 - 25
paddlers/rs_models/cd/cdnet.py

@@ -15,8 +15,23 @@
 import paddle
 import paddle.nn as nn
 
+from .layers import Conv7x7
+
 
 class CDNet(nn.Layer):
+    """
+    The CDNet implementation based on PaddlePaddle.
+
+    The original article refers to
+        Pablo F. Alcantarilla, et al., "Street-View Change Detection with 
+        Deconvolutional Networks"
+        (https://link.springer.com/article/10.1007/s10514-018-9734-5).
+
+    Args:
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+    """
+
     def __init__(self, in_channels=6, num_classes=2):
         super(CDNet, self).__init__()
         self.conv1 = Conv7x7(in_channels, 64, norm=True, act=True)
@@ -48,28 +63,3 @@ class CDNet(nn.Layer):
         x = self.conv7(self.upool2(x, ind2))
         x = self.conv8(self.upool1(x, ind1))
         return [self.conv_out(x)]
-
-
-class Conv7x7(nn.Layer):
-    def __init__(self, in_ch, out_ch, norm=False, act=False):
-        super(Conv7x7, self).__init__()
-        layers = [
-            nn.Pad2D(3), nn.Conv2D(
-                in_ch, out_ch, 7, bias_attr=(False if norm else None))
-        ]
-        if norm:
-            layers.append(nn.BatchNorm2D(out_ch))
-        if act:
-            layers.append(nn.ReLU())
-        self.layers = nn.Sequential(*layers)
-
-    def forward(self, x):
-        return self.layers(x)
-
-
-if __name__ == "__main__":
-    t1 = paddle.randn((1, 3, 512, 512), dtype="float32")
-    t2 = paddle.randn((1, 3, 512, 512), dtype="float32")
-    model = CDNet(6, 2)
-    pred = model(t1, t2)[0]
-    print(pred.shape)

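The removed self-test above doubles as a usage example; a minimal sketch preserving it (only the import path is an assumption):

    import paddle
    from paddlers.rs_models.cd.cdnet import CDNet

    # Mirrors the removed __main__ self-test: 3 bands per temporal phase,
    # so the early-fusion input totals 6 channels.
    t1 = paddle.randn((1, 3, 512, 512), dtype="float32")
    t2 = paddle.randn((1, 3, 512, 512), dtype="float32")
    model = CDNet(6, 2)
    pred = model(t1, t2)[0]
    print(pred.shape)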
+ 11 - 7
paddlers/rs_models/cd/changestar.py

@@ -86,7 +86,8 @@ class ChangeStar_FarSeg(_ChangeStarBase):
     The ChangeStar implementation with a FarSeg encoder based on PaddlePaddle.
 
     The original article refers to
-        Z. Zheng, et al., "Change is Everywhere: Single-Temporal Supervised Object Change Detection in Remote Sensing Imagery"
+        Z. Zheng, et al., "Change is Everywhere: Single-Temporal Supervised Object 
+        Change Detection in Remote Sensing Imagery"
         (https://arxiv.org/abs/2108.07002).
     
     Note that this implementation differs from the original code in two aspects:
@@ -94,12 +95,15 @@ class ChangeStar_FarSeg(_ChangeStarBase):
     2. We use conv-bn-relu instead of conv-relu-bn.
 
     Args:
-        num_classes (int): The number of target classes.
-        mid_channels (int, optional): The number of channels required by the ChangeMixin module. Default: 256.
-        inner_channels (int, optional): The number of filters used in the convolutional layers in the ChangeMixin module. 
-            Default: 16.
-        num_convs (int, optional): The number of convolutional layers used in the ChangeMixin module. Default: 4.
-        scale_factor (float, optional): The scaling factor of the output upsampling layer. Default: 4.0.
+        num_classes (int): Number of target classes.
+        mid_channels (int, optional): Number of channels required by the 
+            ChangeMixin module. Default: 256.
+        inner_channels (int, optional): Number of filters used in the 
+            convolutional layers in the ChangeMixin module. Default: 16.
+        num_convs (int, optional): Number of convolutional layers used in the 
+            ChangeMixin module. Default: 4.
+        scale_factor (float, optional): Scaling factor of the output upsampling 
+            layer. Default: 4.0.
     """
 
     def __init__(

+ 10 - 7
paddlers/rs_models/cd/dsamnet.py

@@ -25,19 +25,22 @@ class DSAMNet(nn.Layer):
     The DSAMNet implementation based on PaddlePaddle.
 
     The original article refers to
-        Q. Shi, et al., "A Deeply Supervised Attention Metric-Based Network and an Open Aerial Image Dataset for Remote Sensing 
-        Change Detection"
+        Q. Shi, et al., "A Deeply Supervised Attention Metric-Based Network and an 
+        Open Aerial Image Dataset for Remote Sensing Change Detection"
         (https://ieeexplore.ieee.org/document/9467555).
 
     Note that this implementation differs from the original work in two aspects:
     1. We do not use multiple dilation rates in layer 4 of the ResNet backbone.
-    2. A classification head is used in place of the original metric learning-based head to stablize the training process.
+    2. A classification head is used in place of the original metric learning-based 
+        head to stabilize the training process.
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        ca_ratio (int, optional): The channel reduction ratio for the channel attention module. Default: 8.
-        sa_kernel (int, optional): The size of the convolutional kernel used in the spatial attention module. Default: 7.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        ca_ratio (int, optional): Channel reduction ratio for the channel 
+            attention module. Default: 8.
+        sa_kernel (int, optional): Size of the convolutional kernel used in the 
+            spatial attention module. Default: 7.
     """
 
     def __init__(self, in_channels, num_classes, ca_ratio=8, sa_kernel=7):

+ 6 - 5
paddlers/rs_models/cd/dsifn.py

@@ -28,16 +28,17 @@ class DSIFN(nn.Layer):
     The DSIFN implementation based on PaddlePaddle.
 
     The original article refers to
-        C. Zhang, et al., "A deeply supervised image fusion network for change detection in high resolution bi-temporal remote 
-        sensing images"
+        C. Zhang, et al., "A deeply supervised image fusion network for change 
+        detection in high resolution bi-temporal remote sensing images"
         (https://www.sciencedirect.com/science/article/pii/S0924271620301532).
 
     Note that in this implementation, there is a flexible number of target classes.
 
     Args:
-        num_classes (int): The number of target classes.
-        use_dropout (bool, optional): A bool value that indicates whether to use dropout layers. When the model is trained 
-            on a relatively small dataset, the dropout layers help prevent overfitting. Default: False.
+        num_classes (int): Number of target classes.
+        use_dropout (bool, optional): A bool value that indicates whether to use 
+            dropout layers. When the model is trained on a relatively small dataset, 
+            the dropout layers help prevent overfitting. Default: False.
     """
 
     def __init__(self, num_classes, use_dropout=False):

+ 7 - 5
paddlers/rs_models/cd/fc_ef.py

@@ -26,14 +26,16 @@ class FCEarlyFusion(nn.Layer):
     The FC-EF implementation based on PaddlePaddle.
 
     The original article refers to
-        Caye Daudt, R., et al. "Fully convolutional siamese networks for change detection"
+        Rodrigo Caye Daudt, et al. "Fully convolutional siamese networks for change 
+        detection"
         (https://arxiv.org/abs/1810.08462).
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        use_dropout (bool, optional): A bool value that indicates whether to use dropout layers. When the model is trained 
-            on a relatively small dataset, the dropout layers help prevent overfitting. Default: False.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        use_dropout (bool, optional): A bool value that indicates whether to use 
+            dropout layers. When the model is trained on a relatively small dataset, 
+            the dropout layers help prevent overfitting. Default: False.
     """
 
     def __init__(self, in_channels, num_classes, use_dropout=False):

+ 7 - 5
paddlers/rs_models/cd/fc_siam_conc.py

@@ -26,14 +26,16 @@ class FCSiamConc(nn.Layer):
     The FC-Siam-conc implementation based on PaddlePaddle.
 
     The original article refers to
-        Caye Daudt, R., et al. "Fully convolutional siamese networks for change detection"
+        Rodrigo Caye Daudt, et al. "Fully convolutional siamese networks for change 
+        detection"
        (https://arxiv.org/abs/1810.08462).
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        use_dropout (bool, optional): A bool value that indicates whether to use dropout layers. When the model is trained 
-            on a relatively small dataset, the dropout layers help prevent overfitting. Default: False.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        use_dropout (bool, optional): A bool value that indicates whether to use 
+            dropout layers. When the model is trained on a relatively small dataset, 
+            the dropout layers help prevent overfitting. Default: False.
     """
 
     def __init__(self, in_channels, num_classes, use_dropout=False):

+ 7 - 5
paddlers/rs_models/cd/fc_siam_diff.py

@@ -26,14 +26,16 @@ class FCSiamDiff(nn.Layer):
     The FC-Siam-diff implementation based on PaddlePaddle.
 
     The original article refers to
-        Caye Daudt, R., et al. "Fully convolutional siamese networks for change detection"
+        Rodrigo Caye Daudt, et al. "Fully convolutional siamese networks for change 
+        detection"
         (https://arxiv.org/abs/1810.08462).
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        use_dropout (bool, optional): A bool value that indicates whether to use dropout layers. When the model is trained 
-            on a relatively small dataset, the dropout layers help prevent overfitting. Default: False.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        use_dropout (bool, optional): A bool value that indicates whether to use 
+            dropout layers. When the model is trained on a relatively small dataset, 
+            the dropout layers help prevent overfitting. Default: False.
     """
 
     def __init__(self, in_channels, num_classes, use_dropout=False):

+ 9 - 6
paddlers/rs_models/cd/layers/attention.py

@@ -28,8 +28,8 @@ class ChannelAttention(nn.Layer):
         (https://arxiv.org/abs/1807.06521).
 
     Args:
-        in_ch (int): The number of channels of the input features.
-        ratio (int, optional): The channel reduction ratio. Default: 8.
+        in_ch (int): Number of channels of the input features.
+        ratio (int, optional): Channel reduction ratio. Default: 8.
     """
 
     def __init__(self, in_ch, ratio=8):
@@ -55,7 +55,8 @@ class SpatialAttention(nn.Layer):
         (https://arxiv.org/abs/1807.06521).
 
     Args:
-        kernel_size (int, optional): The size of the convolutional kernel. Default: 7.
+        kernel_size (int, optional): Size of the convolutional kernel. 
+            Default: 7.
     """
 
     def __init__(self, kernel_size=7):
@@ -79,9 +80,11 @@ class CBAM(nn.Layer):
         (https://arxiv.org/abs/1807.06521).
         (https://arxiv.org/abs/1807.06521).
 
 
     Args:
     Args:
-        in_ch (int): The number of channels of the input features.
-        ratio (int, optional): The channel reduction ratio for the channel attention module. Default: 8.
-        kernel_size (int, optional): The size of the convolutional kernel used in the spatial attention module. Default: 7.
+        in_ch (int): Number of channels of the input features.
+        ratio (int, optional): Channel reduction ratio for the channel 
+            attention module. Default: 8.
+        kernel_size (int, optional): Size of the convolutional kernel used in 
+            the spatial attention module. Default: 7.
     """
     """
 
 
     def __init__(self, in_ch, ratio=8, kernel_size=7):
     def __init__(self, in_ch, ratio=8, kernel_size=7):

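A sketch of how the three documented attention modules fit together (the import path is an assumption, as is the claim that CBAM preserves the input shape):

    import paddle
    from paddlers.rs_models.cd.layers.attention import (  # assumed path
        ChannelAttention, SpatialAttention, CBAM)

    x = paddle.randn([1, 64, 32, 32])
    ca = ChannelAttention(in_ch=64, ratio=8)       # channel attention
    sa = SpatialAttention(kernel_size=7)           # spatial attention
    cbam = CBAM(in_ch=64, ratio=8, kernel_size=7)  # chains both
    y = cbam(x)  # assumed to keep the input shape: [1, 64, 32, 32]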
+ 3 - 1
paddlers/rs_models/cd/layers/blocks.py

@@ -184,7 +184,9 @@ class ConvTransposed3x3(nn.Layer):
 
 
 
 
 class Identity(nn.Layer):
 class Identity(nn.Layer):
-    """A placeholder identity operator that accepts exactly one argument."""
+    """
+    A placeholder identity operator that accepts exactly one argument.
+    """
 
 
     def __init__(self, *args, **kwargs):
     def __init__(self, *args, **kwargs):
         super(Identity, self).__init__()
         super(Identity, self).__init__()

+ 8 - 5
paddlers/rs_models/cd/snunet.py

@@ -27,15 +27,18 @@ class SNUNet(nn.Layer, KaimingInitMixin):
     The SNUNet implementation based on PaddlePaddle.
     The SNUNet implementation based on PaddlePaddle.
 
 
     The original article refers to
     The original article refers to
-        S. Fang, et al., "SNUNet-CD: A Densely Connected Siamese Network for Change Detection of VHR Images"
+        S. Fang, et al., "SNUNet-CD: A Densely Connected Siamese Network for Change 
+        Detection of VHR Images"
         (https://ieeexplore.ieee.org/document/9355573).
         (https://ieeexplore.ieee.org/document/9355573).
 
 
-    Note that bilinear interpolation is adopted as the upsampling method, which is different from the paper.
+    Note that bilinear interpolation is adopted as the upsampling method, which is 
+        different from the paper.
 
 
     Args:
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        width (int, optional): The output channels of the first convolutional layer. Default: 32.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        width (int, optional): Output channels of the first convolutional layer. 
+            Default: 32.
     """
     """
 
 
     def __init__(self, in_channels, num_classes, width=32):
     def __init__(self, in_channels, num_classes, width=32):

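A construction sketch matching the SNUNet docstring (the export path is an assumption):

    from paddlers.rs_models.cd import SNUNet  # assumed export path

    # `width` sets the channel budget: the first convolution outputs 32
    # channels here, and deeper stages scale up from that.
    model = SNUNet(in_channels=3, num_classes=2, width=32)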
+ 15 - 9
paddlers/rs_models/cd/stanet.py

@@ -26,23 +26,29 @@ class STANet(nn.Layer):
     The STANet implementation based on PaddlePaddle.
     The STANet implementation based on PaddlePaddle.
 
 
     The original article refers to
     The original article refers to
-        H. Chen and Z. Shi, "A Spatial-Temporal Attention-Based Method and a New Dataset for Remote Sensing Image Change Detection"
+        H. Chen and Z. Shi, "A Spatial-Temporal Attention-Based Method and a New 
+        Dataset for Remote Sensing Image Change Detection"
         (https://www.mdpi.com/2072-4292/12/10/1662).
         (https://www.mdpi.com/2072-4292/12/10/1662).
 
 
     Note that this implementation differs from the original work in two aspects:
     Note that this implementation differs from the original work in two aspects:
     1. We do not use multiple dilation rates in layer 4 of the ResNet backbone.
     1. We do not use multiple dilation rates in layer 4 of the ResNet backbone.
-    2. A classification head is used in place of the original metric learning-based head to stablize the training process.
+    2. A classification head is used in place of the original metric learning-based 
+        head to stabilize the training process.
 
 
     Args:
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        att_type (str, optional): The attention module used in the model. Options are 'PAM' and 'BAM'. Default: 'BAM'.
-        ds_factor (int, optional): The downsampling factor of the attention modules. When `ds_factor` is set to values 
-            greater than 1, the input features will first be processed by an average pooling layer with the kernel size of 
-            `ds_factor`, before being used to calculate the attention scores. Default: 1.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        att_type (str, optional): The attention module used in the model. Options 
+            are 'PAM' and 'BAM'. Default: 'BAM'.
+        ds_factor (int, optional): Downsampling factor of the attention modules. 
+            When `ds_factor` is set to values greater than 1, the input features 
+            will first be processed by an average pooling layer with the kernel size 
+            of `ds_factor`, before being used to calculate the attention scores. 
+            Default: 1.
 
 
     Raises:
     Raises:
-        ValueError: When `att_type` has an illeagal value (unsupported attention type).
+        ValueError: When `att_type` has an illegal value (unsupported attention 
+            type).
     """
     """
 
 
     def __init__(self, in_channels, num_classes, att_type='BAM', ds_factor=1):
     def __init__(self, in_channels, num_classes, att_type='BAM', ds_factor=1):

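A sketch of the documented options, including the ValueError from the Raises section (the unsupported value 'CAM' is hypothetical, and the export path is an assumption):

    from paddlers.rs_models.cd import STANet  # assumed export path

    # 'PAM' or 'BAM' attention; ds_factor=2 average-pools the features
    # before the attention scores are computed.
    model = STANet(in_channels=3, num_classes=2, att_type='PAM', ds_factor=2)

    try:
        STANet(in_channels=3, num_classes=2, att_type='CAM')
    except ValueError:
        pass  # illegal `att_type`, as documented under Raises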
+ 2 - 1
paddlers/rs_models/res/rcan_model.py

@@ -25,7 +25,8 @@ from ...models.ppgan.modules.init import reset_parameters
 
 
 @MODELS.register()
 @MODELS.register()
 class RCANModel(BaseModel):
 class RCANModel(BaseModel):
-    """Base SR model for single image super-resolution.
+    """
+    Base SR model for single image super-resolution.
     """
     """
 
 
     def __init__(self, generator, pixel_criterion=None, use_init_weight=False):
     def __init__(self, generator, pixel_criterion=None, use_init_weight=False):

+ 5 - 4
paddlers/rs_models/seg/farseg.py

@@ -32,7 +32,7 @@ class FPN(nn.Layer):
     """
     """
     Module that adds FPN on top of a list of feature maps.
     Module that adds FPN on top of a list of feature maps.
     The feature maps are currently supposed to be in increasing depth
     The feature maps are currently supposed to be in increasing depth
-        order, and must be consecutive
+        order, and must be consecutive.
     """
     """
 
 
     def __init__(self,
     def __init__(self,
@@ -233,13 +233,14 @@ class ResNet50Encoder(nn.Layer):
 
 
 
 
 class FarSeg(nn.Layer):
 class FarSeg(nn.Layer):
-    '''
+    """
         The FarSeg implementation based on PaddlePaddle.
         The FarSeg implementation based on PaddlePaddle.
 
 
         The original article refers to
         The original article refers to
-        Zheng, Zhuo, et al. "Foreground-Aware Relation Network for Geospatial Object Segmentation in High Spatial Resolution Remote Sensing Imagery"
+        Zheng, Zhuo, et al. "Foreground-Aware Relation Network for Geospatial Object 
+            Segmentation in High Spatial Resolution Remote Sensing Imagery"
         (https://openaccess.thecvf.com/content_CVPR_2020/papers/Zheng_Foreground-Aware_Relation_Network_for_Geospatial_Object_Segmentation_in_High_Spatial_CVPR_2020_paper.pdf)
         (https://openaccess.thecvf.com/content_CVPR_2020/papers/Zheng_Foreground-Aware_Relation_Network_for_Geospatial_Object_Segmentation_in_High_Spatial_CVPR_2020_paper.pdf)
-    '''
+    """
 
 
     def __init__(self,
     def __init__(self,
                  num_classes=16,
                  num_classes=16,

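A minimal construction sketch for FarSeg (assuming it is exported from paddlers.rs_models.seg and takes a single image batch; the output format is an assumption as well):

    import paddle
    from paddlers.rs_models.seg import FarSeg  # assumed export path

    model = FarSeg(num_classes=16)
    x = paddle.randn([1, 3, 512, 512])
    out = model(x)  # assumed: per-pixel logits for the 16 classes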
+ 5 - 4
paddlers/rs_models/seg/layers/layers_lib.py

@@ -96,16 +96,17 @@ class Activation(nn.Layer):
     """
     """
     The wrapper of activations.
     The wrapper of activations.
     Args:
     Args:
-        act (str, optional): The activation name in lowercase. It must be one of ['elu', 'gelu',
-            'hardshrink', 'tanh', 'hardtanh', 'prelu', 'relu', 'relu6', 'selu', 'leakyrelu', 'sigmoid',
-            'softmax', 'softplus', 'softshrink', 'softsign', 'tanhshrink', 'logsigmoid', 'logsoftmax',
+        act (str, optional): Activation name in lowercase, which must be one of 
+            ['elu', 'gelu', 'hardshrink', 'tanh', 'hardtanh', 'prelu', 'relu', 
+            'relu6', 'selu', 'leakyrelu', 'sigmoid', 'softmax', 'softplus', 
+            'softshrink', 'softsign', 'tanhshrink', 'logsigmoid', 'logsoftmax',
             'hsigmoid']. Default: None, means identical transformation.
             'hsigmoid']. Default: None, means identical transformation.
     Returns:
     Returns:
         A callable object of Activation.
         A callable object of Activation.
     Raises:
     Raises:
         KeyError: When parameter `act` is not in the optional range.
         KeyError: When parameter `act` is not in the optional range.
     Examples:
     Examples:
-        from paddleseg.models.common.activation import Activation
+        from paddlers.rs_models.seg.layers import Activation
         relu = Activation("relu")
         relu = Activation("relu")
         print(relu)
         print(relu)
         # <class 'paddle.nn.layer.activation.ReLU'>
         # <class 'paddle.nn.layer.activation.ReLU'>

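Extending the docstring's own example to the other documented behaviors (the unsupported name 'swish' is hypothetical):

    from paddlers.rs_models.seg.layers import Activation

    relu = Activation("relu")  # wraps the corresponding paddle.nn layer
    noop = Activation()        # act=None: identical transformation

    try:
        Activation("swish")    # not in the documented list of names
    except KeyError:
        pass                   # raised as documented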
+ 25 - 20
paddlers/tasks/base.py

@@ -126,18 +126,18 @@ class BaseModel(metaclass=ModelMeta):
             if not osp.exists(osp.join(resume_checkpoint, 'model.pdparams')):
             if not osp.exists(osp.join(resume_checkpoint, 'model.pdparams')):
                 logging.error(
                 logging.error(
                     "Model parameter state dictionary file 'model.pdparams' "
                     "Model parameter state dictionary file 'model.pdparams' "
-                    "not found under given checkpoint path {}".format(
+                    "was not found in given checkpoint path {}!".format(
                         resume_checkpoint),
                         resume_checkpoint),
                     exit=True)
                     exit=True)
             if not osp.exists(osp.join(resume_checkpoint, 'model.pdopt')):
             if not osp.exists(osp.join(resume_checkpoint, 'model.pdopt')):
                 logging.error(
                 logging.error(
                     "Optimizer state dictionary file 'model.pdparams' "
                     "Optimizer state dictionary file 'model.pdparams' "
-                    "not found under given checkpoint path {}".format(
+                    "was not found in given checkpoint path {}!".format(
                         resume_checkpoint),
                         resume_checkpoint),
                     exit=True)
                     exit=True)
             if not osp.exists(osp.join(resume_checkpoint, 'model.yml')):
             if not osp.exists(osp.join(resume_checkpoint, 'model.yml')):
                 logging.error(
                 logging.error(
-                    "'model.yml' not found under given checkpoint path {}".
+                    "'model.yml' was not found in given checkpoint path {}!".
                     format(resume_checkpoint),
                     format(resume_checkpoint),
                     exit=True)
                     exit=True)
             with open(osp.join(resume_checkpoint, "model.yml")) as f:
             with open(osp.join(resume_checkpoint, "model.yml")) as f:
@@ -264,7 +264,7 @@ class BaseModel(metaclass=ModelMeta):
 
 
     def build_data_loader(self, dataset, batch_size, mode='train'):
     def build_data_loader(self, dataset, batch_size, mode='train'):
         if dataset.num_samples < batch_size:
         if dataset.num_samples < batch_size:
-            raise Exception(
+            raise ValueError(
                 'The volume of dataset({}) must be larger than batch size({}).'
                 'The volume of dataset({}) must be larger than batch size({}).'
                 .format(dataset.num_samples, batch_size))
                 .format(dataset.num_samples, batch_size))
         batch_size_each_card = get_single_card_bs(batch_size=batch_size)
         batch_size_each_card = get_single_card_bs(batch_size=batch_size)
@@ -478,17 +478,21 @@ class BaseModel(metaclass=ModelMeta):
                             save_dir='output'):
                             save_dir='output'):
         """
         """
         Args:
         Args:
-            dataset(paddlers.dataset): Dataset used for evaluation during sensitivity analysis.
-            batch_size(int, optional): Batch size used in evaluation. Defaults to 8.
-            criterion({'l1_norm', 'fpgm'}, optional): Pruning criterion. Defaults to 'l1_norm'.
-            save_dir(str, optional): The directory to save sensitivity file of the model. Defaults to 'output'.
+            dataset (paddlers.datasets.BaseDataset): Dataset used for evaluation during 
+                sensitivity analysis.
+            batch_size (int, optional): Batch size used in evaluation. Defaults to 8.
+            criterion (str, optional): Pruning criterion. Choices are {'l1_norm', 'fpgm'}.
+                Defaults to 'l1_norm'.
+            save_dir (str, optional): Directory to save sensitivity file of the model. 
+                Defaults to 'output'.
         """
         """
+
         if self.__class__.__name__ in {'FasterRCNN', 'MaskRCNN', 'PicoDet'}:
         if self.__class__.__name__ in {'FasterRCNN', 'MaskRCNN', 'PicoDet'}:
-            raise Exception("{} does not support pruning currently!".format(
+            raise ValueError("{} does not support pruning currently!".format(
                 self.__class__.__name__))
                 self.__class__.__name__))
 
 
         assert criterion in {'l1_norm', 'fpgm'}, \
         assert criterion in {'l1_norm', 'fpgm'}, \
-            "Pruning criterion {} is not supported. Please choose from ['l1_norm', 'fpgm']"
+            "Pruning criterion {} is not supported. Please choose from {'l1_norm', 'fpgm'}."
         self._check_transforms(dataset.transforms, 'eval')
         self._check_transforms(dataset.transforms, 'eval')
         if self.model_type == 'detector':
         if self.model_type == 'detector':
             self.net.eval()
             self.net.eval()
@@ -515,13 +519,14 @@ class BaseModel(metaclass=ModelMeta):
     def prune(self, pruned_flops, save_dir=None):
     def prune(self, pruned_flops, save_dir=None):
         """
         """
         Args:
         Args:
-            pruned_flops(float): Ratio of FLOPs to be pruned.
-            save_dir(None or str, optional): If None, the pruned model will not be saved.
-                Otherwise, the pruned model will be saved at save_dir. Defaults to None.
+            pruned_flops (float): Ratio of FLOPs to be pruned.
+            save_dir (str|None, optional): If None, the pruned model will not be 
+                saved. Otherwise, the pruned model will be saved at `save_dir`. 
+                Defaults to None.
         """
         """
         if self.status == "Pruned":
         if self.status == "Pruned":
-            raise Exception(
-                "A pruned model cannot be done model pruning again!")
+            raise ValueError(
+                "A pruned model cannot be pruned for a second time!")
         pre_pruning_flops = flops(self.net, self.pruner.inputs)
         pre_pruning_flops = flops(self.net, self.pruner.inputs)
         logging.info("Pre-pruning FLOPs: {}. Pruning starts...".format(
         logging.info("Pre-pruning FLOPs: {}. Pruning starts...".format(
             pre_pruning_flops))
             pre_pruning_flops))
@@ -529,8 +534,8 @@ class BaseModel(metaclass=ModelMeta):
         post_pruning_flops = flops(self.net, self.pruner.inputs)
         post_pruning_flops = flops(self.net, self.pruner.inputs)
         logging.info("Pruning is complete. Post-pruning FLOPs: {}".format(
         logging.info("Pruning is complete. Post-pruning FLOPs: {}".format(
             post_pruning_flops))
             post_pruning_flops))
-        logging.warning("Pruning the model may hurt its performance, "
-                        "retraining is highly recommended")
+        logging.warning("Pruning the model may hurt its performance. "
+                        "Re-training is highly recommended.")
         self.status = 'Pruned'
         self.status = 'Pruned'
 
 
         if save_dir is not None:
         if save_dir is not None:
@@ -540,7 +545,7 @@ class BaseModel(metaclass=ModelMeta):
     def _prepare_qat(self, quant_config):
     def _prepare_qat(self, quant_config):
         if self.status == 'Infer':
         if self.status == 'Infer':
             logging.error(
             logging.error(
-                "Exported inference model does not support quantization aware training.",
+                "Exported inference model does not support quantization-aware training.",
                 exit=True)
                 exit=True)
         if quant_config is None:
         if quant_config is None:
             # default quantization configuration
             # default quantization configuration
@@ -578,7 +583,7 @@ class BaseModel(metaclass=ModelMeta):
         elif quant_config != self.quant_config:
         elif quant_config != self.quant_config:
             logging.error(
             logging.error(
                 "The model has been quantized with the following quant_config: {}."
                 "The model has been quantized with the following quant_config: {}."
-                "Doing quantization-aware training with a quantized model "
+                "Performing quantization-aware training with a quantized model "
                 "using a different configuration is not supported."
                 "using a different configuration is not supported."
                 .format(self.quant_config),
                 .format(self.quant_config),
                 exit=True)
                 exit=True)
@@ -666,7 +671,7 @@ class BaseModel(metaclass=ModelMeta):
 
 
         # 模型保存成功的标志
         # 模型保存成功的标志
         open(osp.join(save_dir, '.success'), 'w').close()
         open(osp.join(save_dir, '.success'), 'w').close()
-        logging.info("The model for the inference deployment is saved in {}.".
+        logging.info("The inference model for deployment is saved in {}.".
                      format(save_dir))
                      format(save_dir))
 
 
     def _check_transforms(self, transforms, mode):
     def _check_transforms(self, transforms, mode):

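A minimal sketch of the pruning workflow these docstrings describe, assuming `model` is a trained, prunable paddlers task object, `eval_dataset` a matching paddlers.datasets dataset, and that analyze_sensitivity() runs before prune() so the internal pruner exists:

    # Sensitivity analysis writes a sensitivity file under save_dir and
    # prepares the pruner that prune() relies on.
    model.analyze_sensitivity(
        dataset=eval_dataset, batch_size=8, criterion='l1_norm',
        save_dir='output')

    # Prune 10% of FLOPs; pass save_dir to keep the pruned model on disk.
    model.prune(pruned_flops=0.1, save_dir='output/pruned')

As the warning above notes, re-training after pruning is highly recommended.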
+ 106 - 83
paddlers/tasks/change_detector.py

@@ -238,29 +238,37 @@ class BaseChangeDetector(BaseModel):
               resume_checkpoint=None):
               resume_checkpoint=None):
         """
         """
         Train the model.
         Train the model.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to None.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
 
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.CDDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.CDDataset|None, optional): Evaluation dataset. 
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. Defaults to None.
+            learning_rate (float, optional): Learning rate for training. Defaults to .01.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. Defaults 
+                to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
         """
+
         if self.status == 'Infer':
         if self.status == 'Infer':
             logging.error(
             logging.error(
                 "Exported inference model does not support training.",
                 "Exported inference model does not support training.",
@@ -336,28 +344,37 @@ class BaseChangeDetector(BaseModel):
                           quant_config=None):
                           quant_config=None):
         """
         """
         Quantization-aware training.
         Quantization-aware training.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            quant_config(dict or None, optional): Quantization configuration. If None, a default rule of thumb
-                configuration will be used. Defaults to None.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume quantization-aware training
-                from. If None, no training checkpoint will be resumed. Defaults to None.
 
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.CDDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.CDDataset, optional): Evaluation dataset. 
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            learning_rate (float, optional): Learning rate for training. 
+                Defaults to .0001.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            quant_config (dict|None, optional): Quantization configuration. If None, 
+                a default rule of thumb configuration will be used. Defaults to None.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                quantization-aware training from. If None, no training checkpoint will
+                be resumed. Defaults to None.
         """
         """
+
         self._prepare_qat(quant_config)
         self._prepare_qat(quant_config)
         self.train(
         self.train(
             num_epochs=num_epochs,
             num_epochs=num_epochs,
@@ -379,27 +396,32 @@ class BaseChangeDetector(BaseModel):
     def evaluate(self, eval_dataset, batch_size=1, return_details=False):
     def evaluate(self, eval_dataset, batch_size=1, return_details=False):
         """
         """
         Evaluate the model.
         Evaluate the model.
+
         Args:
         Args:
-            eval_dataset(paddlers.dataset): Evaluation dataset.
-            batch_size(int, optional): Total batch size among all cards used for evaluation. Defaults to 1.
-            return_details(bool, optional): Whether to return evaluation details. Defaults to False.
+            eval_dataset (paddlers.datasets.CDDataset): Evaluation dataset.
+            batch_size (int, optional): Total batch size among all cards used for 
+                evaluation. Defaults to 1.
+            return_details (bool, optional): Whether to return evaluation details. 
+                Defaults to False.
 
 
         Returns:
         Returns:
             collections.OrderedDict with key-value pairs:
             collections.OrderedDict with key-value pairs:
-                For binary change detection (number of classes == 2), the key-value pairs are like:
-                {"iou": `intersection over union for the change class`,
-                 "f1": `F1 score for the change class`,
-                 "oacc": `overall accuracy`,
-                 "kappa": ` kappa coefficient`}.
-                For multi-class change detection (number of classes > 2), the key-value pairs are like:
-                {"miou": `mean intersection over union`,
-                 "category_iou": `category-wise mean intersection over union`,
-                 "oacc": `overall accuracy`,
-                 "category_acc": `category-wise accuracy`,
-                 "kappa": ` kappa coefficient`,
-                 "category_F1-score": `F1 score`}.
-
+                For binary change detection (number of classes == 2), the key-value 
+                    pairs are like:
+                    {"iou": `intersection over union for the change class`,
+                    "f1": `F1 score for the change class`,
+                    "oacc": `overall accuracy`,
+                    "kappa": ` kappa coefficient`}.
+                For multi-class change detection (number of classes > 2), the key-value 
+                    pairs are like:
+                    {"miou": `mean intersection over union`,
+                    "category_iou": `category-wise mean intersection over union`,
+                    "oacc": `overall accuracy`,
+                    "category_acc": `category-wise accuracy`,
+                    "kappa": ` kappa coefficient`,
+                    "category_F1-score": `F1 score`}.
         """
         """
+
         self._check_transforms(eval_dataset.transforms, 'eval')
         self._check_transforms(eval_dataset.transforms, 'eval')
 
 
         self.net.eval()
         self.net.eval()
@@ -500,24 +522,27 @@ class BaseChangeDetector(BaseModel):
     def predict(self, img_file, transforms=None):
     def predict(self, img_file, transforms=None):
         """
         """
         Do inference.
         Do inference.
+
         Args:
         Args:
-            Args:
-            img_file (list[tuple] | tuple[str | np.ndarray]):
-                Tuple of image paths or decoded image data for bi-temporal images, which also could constitute a list,
-                meaning all image pairs to be predicted as a mini-batch.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            img_file (list[tuple] | tuple[str|np.ndarray]): Tuple of image paths or 
+                decoded image data for bi-temporal images, or a list of such tuples, 
+                in which case all image pairs are predicted as a mini-batch.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for 
+                inputs. If None, the transforms for the evaluation process will be 
+                used. Defaults to None.
 
 
         Returns:
         Returns:
-            If img_file is a tuple of string or np.array, the result is a dict with key-value pairs:
-            {"label map": `label map`, "score_map": `score map`}.
-            If img_file is a list, the result is a list composed of dicts with the corresponding fields:
-            label_map(np.ndarray): the predicted label map (HW)
-            score_map(np.ndarray): the prediction score map (HWC)
-
+            If `img_file` is a tuple of strings or np.ndarrays, the result is a dict 
+                with key-value pairs:
+                {"label_map": `label map`, "score_map": `score map`}.
+            If `img_file` is a list, the result is a list composed of dicts with the 
+                corresponding fields:
+                label_map (np.ndarray): the predicted label map (HW)
+                score_map (np.ndarray): the prediction score map (HWC)
         """
         """
+
         if transforms is None and not hasattr(self, 'test_transforms'):
         if transforms is None and not hasattr(self, 'test_transforms'):
-            raise Exception("transforms need to be defined, now is None.")
+            raise ValueError("transforms need to be defined, now is None.")
         if transforms is None:
         if transforms is None:
             transforms = self.test_transforms
             transforms = self.test_transforms
         if isinstance(img_file, tuple):
         if isinstance(img_file, tuple):
@@ -555,26 +580,24 @@ class BaseChangeDetector(BaseModel):
                        transforms=None):
                        transforms=None):
         """
         """
         Do inference.
         Do inference.
+
         Args:
         Args:
-            Args:
-            img_file(list[str]):
-                List of image paths.
-            save_dir(str):
-                Directory that contains saved geotiff file.
-            block_size(list[int] | tuple[int] | int, optional):
-                Size of block.
-            overlap(list[int] | tuple[int] | int, optional):
-                Overlap between two blocks. Defaults to 36.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            img_file (tuple[str]): Tuple of two image paths for the bi-temporal images.
+            save_dir (str): Directory where the output GeoTIFF file is saved.
+            block_size (list[int] | tuple[int] | int, optional): Size of the sliding blocks.
+            overlap (list[int] | tuple[int] | int, optional): Overlap between two blocks. 
+                Defaults to 36.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for inputs.
+                If None, the transforms for the evaluation process will be used. Defaults to None.
         """
         """
+
         try:
         try:
             from osgeo import gdal
             from osgeo import gdal
         except:
         except:
             import gdal
             import gdal
 
 
-        if len(img_file) != 2:
-            raise ValueError("`img_file` must be a list of length 2.")
+        if not isinstance(img_file, tuple) or len(img_file) != 2:
+            raise ValueError("`img_file` must be a tuple of length 2.")
         if isinstance(block_size, int):
         if isinstance(block_size, int):
             block_size = (block_size, block_size)
             block_size = (block_size, block_size)
         elif isinstance(block_size, (tuple, list)) and len(block_size) == 2:
         elif isinstance(block_size, (tuple, list)) and len(block_size) == 2:

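A usage sketch of the two inference entry points for change detection (assuming `model` was restored with paddlers.tasks.load_model, the file names are illustrative, and the bi-temporal GeoTIFFs are co-registered; the dict keys follow the docstring above):

    pred = model.predict(('T1.tif', 'T2.tif'))
    label_map = pred['label_map']  # HW, predicted classes
    score_map = pred['score_map']  # HWC, per-class scores

    # Whole-scene inference on large rasters: 512x512 blocks with a
    # 36-pixel overlap, written as GeoTIFF under save_dir.
    model.slide_predict(
        img_file=('T1.tif', 'T2.tif'), save_dir='output',
        block_size=512, overlap=36)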
+ 84 - 59
paddlers/tasks/classifier.py

@@ -52,7 +52,7 @@ class BaseClassifier(BaseModel):
         super(BaseClassifier, self).__init__('classifier')
         super(BaseClassifier, self).__init__('classifier')
         if not hasattr(paddleclas.arch.backbone, model_name) and \
         if not hasattr(paddleclas.arch.backbone, model_name) and \
            not hasattr(cmcls, model_name):
            not hasattr(cmcls, model_name):
-            raise Exception("ERROR: There's no model named {}.".format(
+            raise ValueError("ERROR: There is no model named {}.".format(
                 model_name))
                 model_name))
         self.model_name = model_name
         self.model_name = model_name
         self.in_channels = in_channels
         self.in_channels = in_channels
@@ -202,29 +202,39 @@ class BaseClassifier(BaseModel):
               resume_checkpoint=None):
               resume_checkpoint=None):
         """
         """
         Train the model.
         Train the model.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'CITYSCAPES'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
 
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.ClasDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.ClasDataset, optional): Evaluation dataset. 
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'IMAGENET'.
+            learning_rate (float, optional): Learning rate for training. 
+                Defaults to .1.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
         """
+
         if self.status == 'Infer':
         if self.status == 'Infer':
             logging.error(
             logging.error(
                 "Exported inference model does not support training.",
                 "Exported inference model does not support training.",
@@ -303,28 +313,37 @@ class BaseClassifier(BaseModel):
                           quant_config=None):
                           quant_config=None):
         """
         """
         Quantization-aware training.
         Quantization-aware training.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            quant_config(dict or None, optional): Quantization configuration. If None, a default rule of thumb
-                configuration will be used. Defaults to None.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume quantization-aware training
-                from. If None, no training checkpoint will be resumed. Defaults to None.
 
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.ClasDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.ClasDataset, optional): Evaluation dataset. 
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            learning_rate (float, optional): Learning rate for training. 
+                Defaults to .0001.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            quant_config (dict|None, optional): Quantization configuration. If None, 
+                a default rule of thumb configuration will be used. Defaults to None.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                quantization-aware training from. If None, no training checkpoint will
+                be resumed. Defaults to None.
         """
         """
+
         self._prepare_qat(quant_config)
         self._prepare_qat(quant_config)
         self.train(
         self.train(
             num_epochs=num_epochs,
             num_epochs=num_epochs,
@@ -346,17 +365,20 @@ class BaseClassifier(BaseModel):
     def evaluate(self, eval_dataset, batch_size=1, return_details=False):
     def evaluate(self, eval_dataset, batch_size=1, return_details=False):
         """
         """
         Evaluate the model.
         Evaluate the model.
+
         Args:
         Args:
-            eval_dataset(paddlers.dataset): Evaluation dataset.
-            batch_size(int, optional): Total batch size among all cards used for evaluation. Defaults to 1.
-            return_details(bool, optional): Whether to return evaluation details. Defaults to False.
+            eval_dataset (paddlers.datasets.ClasDataset): Evaluation dataset.
+            batch_size (int, optional): Total batch size among all cards used for 
+                evaluation. Defaults to 1.
+            return_details (bool, optional): Whether to return evaluation details. 
+                Defaults to False.
 
 
         Returns:
         Returns:
             collections.OrderedDict with key-value pairs:
             collections.OrderedDict with key-value pairs:
                 {"top1": `acc of top1`,
                 {"top1": `acc of top1`,
                  "top5": `acc of top5`}.
                  "top5": `acc of top5`}.
-
         """
         """
+
         self._check_transforms(eval_dataset.transforms, 'eval')
         self._check_transforms(eval_dataset.transforms, 'eval')
 
 
         self.net.eval()
         self.net.eval()
@@ -404,25 +426,28 @@ class BaseClassifier(BaseModel):
     def predict(self, img_file, transforms=None):
     def predict(self, img_file, transforms=None):
         """
         """
         Do inference.
         Do inference.
+
         Args:
         Args:
-            Args:
-            img_file(list[np.ndarray | str] | str | np.ndarray):
-                Image path or decoded image data, which also could constitute a list, meaning all images to be 
+            img_file (list[np.ndarray|str] | str | np.ndarray): Image path or decoded 
+                image data, or a list of them, in which case all images are 
                 predicted as a mini-batch.
                 predicted as a mini-batch.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for 
+                inputs. If None, the transforms for the evaluation process will be 
+                used. Defaults to None.
 
 
         Returns:
         Returns:
-            If img_file is a string or np.array, the result is a dict with key-value pairs:
-            {"label map": `class_ids_map`, "scores_map": `label_names_map`}.
-            If img_file is a list, the result is a list composed of dicts with the corresponding fields:
-            class_ids_map(np.ndarray): class_ids
-            scores_map(np.ndarray): scores
-            label_names_map(np.ndarray): label_names
-
+            If `img_file` is a string or np.ndarray, the result is a dict with key-value 
+                pairs:
+                {"class_ids_map": `class_ids`, "scores_map": `scores`, 
+                "label_names_map": `label_names`}.
+            If `img_file` is a list, the result is a list composed of dicts with the 
+                corresponding fields:
+                class_ids_map (np.ndarray): class_ids
+                scores_map (np.ndarray): scores
+                label_names_map (np.ndarray): label_names
         """
         """
+
         if transforms is None and not hasattr(self, 'test_transforms'):
         if transforms is None and not hasattr(self, 'test_transforms'):
-            raise Exception("transforms need to be defined, now is None.")
+            raise ValueError("transforms need to be defined, now is None.")
         if transforms is None:
         if transforms is None:
             transforms = self.test_transforms
             transforms = self.test_transforms
         if isinstance(img_file, (str, np.ndarray)):
         if isinstance(img_file, (str, np.ndarray)):

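For the classifier, a sketch of single-image and mini-batch prediction under the same assumptions (file names are illustrative):

    pred = model.predict('scene.png')  # single image -> one dict
    print(pred['class_ids_map'], pred['scores_map'],
          pred['label_names_map'])

    preds = model.predict(['a.png', 'b.png'])  # list -> list of dicts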
+ 4 - 4
paddlers/tasks/load_model.py

@@ -52,7 +52,7 @@ def load_model(model_dir, **params):
     Load saved model from a given directory.
     Load saved model from a given directory.
 
 
     Args:
     Args:
-        model_dir(str): The directory where the model is saved.
+        model_dir (str): Directory where the model is saved.
 
 
     Returns:
     Returns:
         The model loaded from the directory.
         The model loaded from the directory.
@@ -61,8 +61,8 @@ def load_model(model_dir, **params):
     if not osp.exists(model_dir):
     if not osp.exists(model_dir):
         logging.error("Directory '{}' does not exist!".format(model_dir))
         logging.error("Directory '{}' does not exist!".format(model_dir))
     if not osp.exists(osp.join(model_dir, "model.yml")):
     if not osp.exists(osp.join(model_dir, "model.yml")):
-        raise Exception("There is no file named model.yml in {}.".format(
-            model_dir))
+        raise FileNotFoundError(
+            "There is no file named model.yml in {}.".format(model_dir))
 
 
     with open(osp.join(model_dir, "model.yml")) as f:
     with open(osp.join(model_dir, "model.yml")) as f:
         model_info = yaml.load(f.read(), Loader=yaml.Loader)
         model_info = yaml.load(f.read(), Loader=yaml.Loader)
@@ -76,7 +76,7 @@ def load_model(model_dir, **params):
     model_type = model_info['_Attributes']['model_type']
     model_type = model_info['_Attributes']['model_type']
     mod = getattr(paddlers.tasks, model_type)
     mod = getattr(paddlers.tasks, model_type)
     if not hasattr(mod, model_info['Model']):
     if not hasattr(mod, model_info['Model']):
-        raise Exception("There is no {} attribute in {}.".format(model_info[
+        raise ValueError("There is no {} attribute in {}.".format(model_info[
             'Model'], mod))
             'Model'], mod))
     if 'model_name' in model_info['_init_params']:
     if 'model_name' in model_info['_init_params']:
         del model_info['_init_params']['model_name']
         del model_info['_init_params']['model_name']

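A sketch of restoring a saved model (assuming load_model is re-exported at paddlers.tasks; the directory name is illustrative and must contain the model.yml written at save time):

    import paddlers

    # Raises FileNotFoundError if output/best_model/model.yml is missing.
    model = paddlers.tasks.load_model('output/best_model')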
+ 268 - 168
paddlers/tasks/object_detector.py

@@ -81,7 +81,7 @@ class BaseDetector(BaseModel):
         if len(image_shape) == 2:
         if len(image_shape) == 2:
             image_shape = [1, 3] + image_shape
             image_shape = [1, 3] + image_shape
         if image_shape[-2] % 32 > 0 or image_shape[-1] % 32 > 0:
         if image_shape[-2] % 32 > 0 or image_shape[-1] % 32 > 0:
-            raise Exception(
+            raise ValueError(
                 "Height and width in fixed_input_shape must be a multiple of 32, but received {}.".
                 "Height and width in fixed_input_shape must be a multiple of 32, but received {}.".
                 format(image_shape[-2:]))
                 format(image_shape[-2:]))
         return image_shape
         return image_shape
@@ -206,34 +206,51 @@ class BaseDetector(BaseModel):
               resume_checkpoint=None):
               resume_checkpoint=None):
         """
         """
         Train the model.
         Train the model.
+
         Args:
         Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'IMAGENET'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .001.
-            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
-            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0..
-            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
-            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 64.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset, optional): 
+                Evaluation dataset. If None, the model will not be evaluated during training 
+                process. Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used for 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 10.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'IMAGENET'.
+            learning_rate (float, optional): Learning rate for training. Defaults to .001.
+            warmup_steps (int, optional): Number of steps of warm-up training. 
+                Defaults to 0.
+            warmup_start_lr (float, optional): Start learning rate of warm-up training. 
+                Defaults to 0..
+            lr_decay_epochs (list|tuple, optional): Epoch milestones for learning 
+                rate decay. Defaults to (216, 243).
+            lr_decay_gamma (float, optional): Gamma coefficient of learning rate decay. 
+                Defaults to .1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, the metric is determined according to the dataset format. 
+                Defaults to None.
+            use_ema (bool, optional): Whether to use exponential moving average 
+                strategy. Defaults to False.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
         """
+
         if self.status == 'Infer':
             logging.error(
                 "Exported inference model does not support training.",
@@ -242,7 +259,7 @@ class BaseDetector(BaseModel):
             logging.error(
                 "pretrain_weights and resume_checkpoint cannot be set simultaneously.",
                 exit=True)
-        if train_dataset.__class__.__name__ == 'VOCDetection':
+        if train_dataset.__class__.__name__ == 'VOCDetDataset':
             train_dataset.data_fields = {
                 'im_id', 'image_shape', 'image', 'gt_bbox', 'gt_class',
                 'difficult'
@@ -260,13 +277,13 @@ class BaseDetector(BaseModel):
             }
 
         if metric is None:
-            if eval_dataset.__class__.__name__ == 'VOCDetection':
+            if eval_dataset.__class__.__name__ == 'VOCDetDataset':
                 self.metric = 'voc'
-            elif eval_dataset.__class__.__name__ == 'CocoDetection':
+            elif eval_dataset.__class__.__name__ == 'COCODetDataset':
                 self.metric = 'coco'
         else:
             assert metric.lower() in ['coco', 'voc'], \
-                "Evaluation metric {} is not supported, please choose form 'COCO' and 'VOC'"
+                "Evaluation metric {} is not supported. Please choose from 'COCO' and 'VOC'."
             self.metric = metric.lower()
 
         self.labels = train_dataset.labels
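
For context on how the retyped `train()` signature is meant to be used, here is a minimal, hedged sketch. The dataset paths, transform pipeline, and the `PPYOLO` task choice are illustrative assumptions, not part of this commit, and exact module paths may differ between PaddleRS versions:

```python
# Hypothetical training sketch for a PaddleRS detector; all paths are placeholders.
import paddlers as pdrs
from paddlers import transforms as T

# Assumed transform pipeline; any Compose of paddlers transforms works here.
train_transforms = T.Compose([
    T.RandomHorizontalFlip(),
    T.Normalize(
        mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
])

train_dataset = pdrs.datasets.VOCDetDataset(
    data_dir='dataset',
    file_list='dataset/train_list.txt',
    label_list='dataset/labels.txt',
    transforms=train_transforms)

model = pdrs.tasks.PPYOLO(num_classes=len(train_dataset.labels))
model.train(
    num_epochs=270,
    train_dataset=train_dataset,
    train_batch_size=8,
    learning_rate=0.001,
    warmup_steps=100,
    warmup_start_lr=0.0,
    lr_decay_epochs=(216, 243),  # the documented default milestones
    save_dir='output/ppyolo')
```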
@@ -355,33 +372,50 @@ class BaseDetector(BaseModel):
                           quant_config=None):
         """
         Quantization-aware training.
+
         Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .001.
-            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
-            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0..
-            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
-            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            quant_config(dict or None, optional): Quantization configuration. If None, a default rule of thumb
-                configuration will be used. Defaults to None.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume quantization-aware training
-                from. If None, no training checkpoint will be resumed. Defaults to None.
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 64.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset, optional): 
+                Evaluation dataset. If None, the model will not be evaluated during training 
+                process. Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used for 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 10.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            learning_rate (float, optional): Learning rate for training. 
+                Defaults to .00001.
+            warmup_steps (int, optional): Number of steps of warm-up training. 
+                Defaults to 0.
+            warmup_start_lr (float, optional): Start learning rate of warm-up training. 
+                Defaults to 0.0.
+            lr_decay_epochs (list|tuple, optional): Epoch milestones for learning rate 
+                decay. Defaults to (216, 243).
+            lr_decay_gamma (float, optional): Gamma coefficient of learning rate decay. 
+                Defaults to .1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, determine the metric according to the dataset format. 
+                Defaults to None.
+            use_ema (bool, optional): Whether to use exponential moving average strategy. 
+                Defaults to False.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            quant_config (dict|None, optional): Quantization configuration. If None, 
+                a default rule of thumb configuration will be used. Defaults to None.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                quantization-aware training from. If None, no training checkpoint will
+                be resumed. Defaults to None.
         """
         """
+
         self._prepare_qat(quant_config)
         self.train(
             num_epochs=num_epochs,
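
A hedged sketch of how this method is typically invoked; it wraps `train()` after quantization preparation, so it accepts the same arguments. The `model` and `train_dataset` variables are assumed from the earlier hypothetical training sketch:

```python
# Quantization-aware fine-tuning sketch; values below are illustrative.
model.quant_aware_train(
    num_epochs=5,
    train_dataset=train_dataset,
    train_batch_size=8,
    learning_rate=1e-5,   # QAT usually fine-tunes with a much smaller LR
    quant_config=None,    # None selects the default rule-of-thumb config
    save_dir='output/ppyolo_quant')
```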
@@ -412,25 +446,32 @@ class BaseDetector(BaseModel):
                  return_details=False):
         """
         Evaluate the model.
+
         Args:
-            eval_dataset(paddlers.dataset): Evaluation dataset.
-            batch_size(int, optional): Total batch size among all cards used for evaluation. Defaults to 1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            return_details(bool, optional): Whether to return evaluation details. Defaults to False.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Evaluation dataset.
+            batch_size (int, optional): Total batch size among all cards used for 
+                evaluation. Defaults to 1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, determine the metric according to the dataset format. 
+                Defaults to None.
+            return_details (bool, optional): Whether to return evaluation details. 
+                Defaults to False.
+
         Returns:
-            collections.OrderedDict with key-value pairs: {"mAP(0.50, 11point)":`mean average precision`}.
+            collections.OrderedDict with key-value pairs: 
+                {"mAP(0.50, 11point)":`mean average precision`}.
         """
         """
 
 
         if metric is None:
             if not hasattr(self, 'metric'):
-                if eval_dataset.__class__.__name__ == 'VOCDetection':
+                if eval_dataset.__class__.__name__ == 'VOCDetDataset':
                     self.metric = 'voc'
-                elif eval_dataset.__class__.__name__ == 'CocoDetection':
+                elif eval_dataset.__class__.__name__ == 'COCODetDataset':
                     self.metric = 'coco'
         else:
             assert metric.lower() in ['coco', 'voc'], \
-                "Evaluation metric {} is not supported, please choose form 'COCO' and 'VOC'"
+                "Evaluation metric {} is not supported. Please choose from 'COCO' and 'VOC'."
             self.metric = metric.lower()
 
         if self.metric == 'voc':
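
Usage-wise, the returned `collections.OrderedDict` can be consumed directly. A small hedged example; the exact key set depends on the metric chosen, with the key shown in the docstring above used for VOC-style mAP:

```python
# Hedged evaluation sketch; `model` and `eval_dataset` are assumed to exist.
eval_metrics = model.evaluate(eval_dataset, batch_size=1, metric='VOC')
print(eval_metrics)  # e.g. an OrderedDict containing 'mAP(0.50, 11point)'
map_50 = eval_metrics.get('mAP(0.50, 11point)')
```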
@@ -506,24 +547,32 @@ class BaseDetector(BaseModel):
     def predict(self, img_file, transforms=None):
         """
         Do inference.
+
         Args:
-            img_file(list[np.ndarray | str] | str | np.ndarray):
-                Image path or decoded image data, which also could constitute a list,meaning all images to be 
+            img_file (list[np.ndarray|str] | str | np.ndarray): Image path or decoded 
+                image data, or a list of these, in which case all images will be 
                 predicted as a mini-batch.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for 
+                inputs. If None, the transforms for the evaluation process will be used. 
+                Defaults to None.
+
         Returns:
-            If img_file is a string or np.array, the result is a list of dict with key-value pairs:
-            {"category_id": `category_id`, "category": `category`, "bbox": `[x, y, w, h]`, "score": `score`}.
-            If img_file is a list, the result is a list composed of dicts with the corresponding fields:
-            category_id(int): the predicted category ID. 0 represents the first category in the dataset, and so on.
-            category(str): category name
-            bbox(list): bounding box in [x, y, w, h] format
-            score(str): confidence
-            mask(dict): Only for instance segmentation task. Mask of the object in RLE format
+            If `img_file` is a string or np.array, the result is a list of dicts with 
+                key-value pairs:
+                {"category_id": `category_id`, "category": `category`, "bbox": `[x, y, w, h]`, "score": `score`}.
+            If `img_file` is a list, the result is a list composed of dicts with the 
+                corresponding fields:
+                category_id (int): Predicted category ID. 0 represents the first 
+                    category in the dataset, and so on.
+                category (str): Category name.
+                bbox (list): Bounding box in [x, y, w, h] format.
+                score (float): Confidence score.
+                mask (dict): Mask of the object in RLE format. Only for instance 
+                    segmentation tasks.
         """
         """
+
         if transforms is None and not hasattr(self, 'test_transforms'):
-            raise Exception("transforms need to be defined, now is None.")
+            raise ValueError("transforms need to be defined, now is None.")
         if transforms is None:
             transforms = self.test_transforms
         if isinstance(img_file, (str, np.ndarray)):
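
To make the documented return structure concrete, a hedged inference sketch; the file names are placeholders:

```python
# Hypothetical detector inference sketch.
results = model.predict('demo.jpg')                # one image -> list of dicts
batch_results = model.predict(['a.jpg', 'b.jpg'])  # list input -> mini-batch
for det in results:
    if det['score'] > 0.5:                   # score is a confidence value
        print(det['category'], det['bbox'])  # bbox is in [x, y, w, h] format
```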
@@ -649,7 +698,7 @@ class PicoDet(BaseDetector):
         }:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ESNet_s', 'ESNet_m', 'ESNet_l', 'LCNet', 'MobileNetV3', 'ResNet18_vd')".
+                "{'ESNet_s', 'ESNet_m', 'ESNet_l', 'LCNet', 'MobileNetV3', 'ResNet18_vd'}.".
                 format(backbone))
         self.backbone_name = backbone
         if params.get('with_net', True):
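
One subtlety behind the message rewrites in this and the following hunks: the set-style literals now contain braces, and a literal brace inside a string that is later passed to `str.format()` must be doubled, or `format()` parses it as a replacement field and raises `KeyError` at runtime. The replacement strings are therefore written with `{{...}}` here. A standalone illustration:

```python
# Literal braces in str.format() templates must be escaped by doubling them.
bad = "backbone: {} is not supported. Please choose one of {'A', 'B'}."
good = "backbone: {} is not supported. Please choose one of {{'A', 'B'}}."

try:
    bad.format("X")        # KeyError: "'A', 'B'" is parsed as a field name
except KeyError as err:
    print("unescaped braces:", err)

print(good.format("X"))    # ... Please choose one of {'A', 'B'}.
```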
@@ -772,7 +821,7 @@ class PicoDet(BaseDetector):
         for i, op in enumerate(transforms.transforms):
             if isinstance(op, (BatchRandomResize, BatchRandomResizeByShort)):
                 if mode != 'train':
-                    raise Exception(
+                    raise ValueError(
                         "{} cannot be present in the {} transforms. ".format(
                         "{} cannot be present in the {} transforms. ".format(
                             op.__class__.__name__, mode) +
                             op.__class__.__name__, mode) +
                         "Please check the {} transforms.".format(mode))
                         "Please check the {} transforms.".format(mode))
@@ -851,34 +900,51 @@ class PicoDet(BaseDetector):
               resume_checkpoint=None):
         """
         Train the model.
+
         Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'IMAGENET'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .001.
-            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
-            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0..
-            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
-            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 64.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset, optional): 
+                Evaluation dataset. If None, the model will not be evaluated during training 
+                process. Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used for 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 10.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'IMAGENET'.
+            learning_rate (float, optional): Learning rate for training. Defaults to .001.
+            warmup_steps (int, optional): Number of steps of warm-up training. 
+                Defaults to 0.
+            warmup_start_lr (float, optional): Start learning rate of warm-up training. 
+                Defaults to 0.0.
+            lr_decay_epochs (list|tuple, optional): Epoch milestones for learning 
+                rate decay. Defaults to (216, 243).
+            lr_decay_gamma (float, optional): Gamma coefficient of learning rate decay. 
+                Defaults to .1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, determine the metric according to the dataset format. 
+                Defaults to None.
+            use_ema (bool, optional): Whether to use exponential moving average 
+                strategy. Defaults to False.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
         """
+
         if optimizer is None:
             num_steps_each_epoch = len(train_dataset) // train_batch_size
             optimizer = self.default_optimizer(
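
The warm-up and decay arguments documented above map naturally onto Paddle's LR schedulers. A hedged sketch of that mapping, mirroring the documented defaults rather than the exact body of `default_optimizer`:

```python
# Hedged sketch: piecewise decay at lr_decay_epochs (scaled by lr_decay_gamma),
# wrapped in a linear warm-up over warmup_steps. steps_per_epoch is assumed.
import paddle

learning_rate, warmup_steps, warmup_start_lr = 0.001, 100, 0.0
lr_decay_epochs, lr_decay_gamma, steps_per_epoch = (216, 243), 0.1, 500

boundaries = [e * steps_per_epoch for e in lr_decay_epochs]
values = [learning_rate * lr_decay_gamma**i for i in range(len(boundaries) + 1)]
sched = paddle.optimizer.lr.PiecewiseDecay(boundaries, values)
sched = paddle.optimizer.lr.LinearWarmup(
    sched, warmup_steps, warmup_start_lr, learning_rate)
```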
@@ -936,8 +1002,8 @@ class YOLOv3(BaseDetector):
         }:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('MobileNetV1', 'MobileNetV1_ssld', 'MobileNetV3', 'MobileNetV3_ssld', 'DarkNet53', "
-                "'ResNet50_vd_dcn', 'ResNet34')".format(backbone))
+                "{'MobileNetV1', 'MobileNetV1_ssld', 'MobileNetV3', 'MobileNetV3_ssld', 'DarkNet53', "
+                "'ResNet50_vd_dcn', 'ResNet34'}.".format(backbone))
 
         self.backbone_name = backbone
         if params.get('with_net', True):
@@ -1030,7 +1096,7 @@ class YOLOv3(BaseDetector):
         for i, op in enumerate(transforms.transforms):
             if isinstance(op, (BatchRandomResize, BatchRandomResizeByShort)):
                 if mode != 'train':
-                    raise Exception(
+                    raise ValueError(
                         "{} cannot be present in the {} transforms. ".format(
                         "{} cannot be present in the {} transforms. ".format(
                             op.__class__.__name__, mode) +
                             op.__class__.__name__, mode) +
                         "Please check the {} transforms.".format(mode))
                         "Please check the {} transforms.".format(mode))
@@ -1089,8 +1155,8 @@ class FasterRCNN(BaseDetector):
         }:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ResNet50', 'ResNet50_vd', 'ResNet50_vd_ssld', 'ResNet34', 'ResNet34_vd', "
-                "'ResNet101', 'ResNet101_vd', 'HRNet_W18')".format(backbone))
+                "{'ResNet50', 'ResNet50_vd', 'ResNet50_vd_ssld', 'ResNet34', 'ResNet34_vd', "
+                "'ResNet101', 'ResNet101_vd', 'HRNet_W18'}.".format(backbone))
         self.backbone_name = backbone
 
         if params.get('with_net', True):
@@ -1327,34 +1393,51 @@ class FasterRCNN(BaseDetector):
               resume_checkpoint=None):
         """
         Train the model.
+
         Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'IMAGENET'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .001.
-            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
-            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0..
-            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
-            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 64.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset, optional): 
+                Evaluation dataset. If None, the model will not be evaluated during training 
+                process. Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used for 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 10.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'IMAGENET'.
+            learning_rate (float, optional): Learning rate for training. Defaults to .001.
+            warmup_steps (int, optional): Number of steps of warm-up training. 
+                Defaults to 0.
+            warmup_start_lr (float, optional): Start learning rate of warm-up training. 
+                Defaults to 0.0.
+            lr_decay_epochs (list|tuple, optional): Epoch milestones for learning 
+                rate decay. Defaults to (216, 243).
+            lr_decay_gamma (float, optional): Gamma coefficient of learning rate decay. 
+                Defaults to .1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, determine the metric according to the dataset format. 
+                Defaults to None.
+            use_ema (bool, optional): Whether to use exponential moving average 
+                strategy. Defaults to False.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
         """
+
         if train_dataset.pos_num < len(train_dataset.file_list):
             train_dataset.num_workers = 0
         super(FasterRCNN, self).train(
@@ -1377,7 +1460,7 @@ class FasterRCNN(BaseDetector):
         for i, op in enumerate(transforms.transforms):
             if isinstance(op, (BatchRandomResize, BatchRandomResizeByShort)):
                 if mode != 'train':
-                    raise Exception(
+                    raise ValueError(
                         "{} cannot be present in the {} transforms. ".format(
                         "{} cannot be present in the {} transforms. ".format(
                             op.__class__.__name__, mode) +
                             op.__class__.__name__, mode) +
                         "Please check the {} transforms.".format(mode))
                         "Please check the {} transforms.".format(mode))
@@ -1456,7 +1539,7 @@ class PPYOLO(YOLOv3):
         }:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ResNet50_vd_dcn', 'ResNet18_vd', 'MobileNetV3_large', 'MobileNetV3_small')".
+                "{'ResNet50_vd_dcn', 'ResNet18_vd', 'MobileNetV3_large', 'MobileNetV3_small'}.".
                 format(backbone))
         self.backbone_name = backbone
         self.downsample_ratios = [
@@ -1769,7 +1852,7 @@ class PPYOLOv2(YOLOv3):
         if backbone not in {'ResNet50_vd_dcn', 'ResNet101_vd_dcn'}:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ResNet50_vd_dcn', 'ResNet101_vd_dcn')".format(backbone))
+                "{'ResNet50_vd_dcn', 'ResNet101_vd_dcn'}.".format(backbone))
         self.backbone_name = backbone
         self.downsample_ratios = [32, 16, 8]
 
@@ -1916,7 +1999,7 @@ class MaskRCNN(BaseDetector):
         }:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ResNet50', 'ResNet50_vd', 'ResNet50_vd_ssld', 'ResNet101', 'ResNet101_vd')".
+                "{'ResNet50', 'ResNet50_vd', 'ResNet50_vd_ssld', 'ResNet101', 'ResNet101_vd'}.".
                 format(backbone))
 
         self.backbone_name = backbone + '_fpn' if with_fpn else backbone
@@ -2152,34 +2235,51 @@ class MaskRCNN(BaseDetector):
               resume_checkpoint=None):
         """
         Train the model.
+
         Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'IMAGENET'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .001.
-            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
-            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0..
-            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
-            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 64.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset, optional): 
+                Evaluation dataset. If None, the model will not be evaluated during training 
+                process. Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used for 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 10.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'IMAGENET'.
+            learning_rate (float, optional): Learning rate for training. Defaults to .001.
+            warmup_steps (int, optional): Number of steps of warm-up training. 
+                Defaults to 0.
+            warmup_start_lr (float, optional): Start learning rate of warm-up training. 
+                Defaults to 0.0.
+            lr_decay_epochs (list|tuple, optional): Epoch milestones for learning 
+                rate decay. Defaults to (216, 243).
+            lr_decay_gamma (float, optional): Gamma coefficient of learning rate decay. 
+                Defaults to .1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, determine the metric according to the dataset format. 
+                Defaults to None.
+            use_ema (bool, optional): Whether to use exponential moving average 
+                strategy. Defaults to False.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
         """
+
         if train_dataset.pos_num < len(train_dataset.file_list):
             train_dataset.num_workers = 0
         super(MaskRCNN, self).train(
@@ -2202,7 +2302,7 @@ class MaskRCNN(BaseDetector):
         for i, op in enumerate(transforms.transforms):
             if isinstance(op, (BatchRandomResize, BatchRandomResizeByShort)):
                 if mode != 'train':
-                    raise Exception(
+                    raise ValueError(
                         "{} cannot be present in the {} transforms. ".format(
                         "{} cannot be present in the {} transforms. ".format(
                             op.__class__.__name__, mode) +
                             op.__class__.__name__, mode) +
                         "Please check the {} transforms.".format(mode))
                         "Please check the {} transforms.".format(mode))

+ 93 - 68
paddlers/tasks/segmenter.py

@@ -228,29 +228,38 @@ class BaseSegmenter(BaseModel):
               resume_checkpoint=None):
         """
         Train the model.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'CITYSCAPES'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.SegDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.SegDataset|None, optional): Evaluation dataset. 
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'CITYSCAPES'.
+            learning_rate (float, optional): Learning rate for training. Defaults to .025.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. Defaults 
+                to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
         """
+
         if self.status == 'Infer':
             logging.error(
                 "Exported inference model does not support training.",
@@ -326,28 +335,37 @@ class BaseSegmenter(BaseModel):
                           quant_config=None):
         """
         Quantization-aware training.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            quant_config(dict or None, optional): Quantization configuration. If None, a default rule of thumb
-                configuration will be used. Defaults to None.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume quantization-aware training
-                from. If None, no training checkpoint will be resumed. Defaults to None.
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.SegDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.SegDataset|None, optional): Evaluation dataset.
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            learning_rate (float, optional): Learning rate for training. 
+                Defaults to .0001.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            quant_config (dict|None, optional): Quantization configuration. If None, 
+                a default rule of thumb configuration will be used. Defaults to None.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                quantization-aware training from. If None, no training checkpoint will
+                be resumed. Defaults to None.
         """
         """
+
         self._prepare_qat(quant_config)
         self.train(
             num_epochs=num_epochs,
@@ -369,10 +387,13 @@ class BaseSegmenter(BaseModel):
     def evaluate(self, eval_dataset, batch_size=1, return_details=False):
         """
         Evaluate the model.
+
         Args:
-            eval_dataset(paddlers.dataset): Evaluation dataset.
-            batch_size(int, optional): Total batch size among all cards used for evaluation. Defaults to 1.
-            return_details(bool, optional): Whether to return evaluation details. Defaults to False.
+            eval_dataset (paddlers.datasets.SegDataset): Evaluation dataset.
+            batch_size (int, optional): Total batch size among all cards used for 
+                evaluation. Defaults to 1.
+            return_details (bool, optional): Whether to return evaluation details. 
+                Defaults to False.
 
         Returns:
             collections.OrderedDict with key-value pairs:
@@ -384,6 +405,7 @@ class BaseSegmenter(BaseModel):
                  "category_F1-score": `F1 score`}.
                  "category_F1-score": `F1 score`}.
 
 
         """
         """
+
         self._check_transforms(eval_dataset.transforms, 'eval')
 
         self.net.eval()
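
Since evaluation returns an OrderedDict keyed as documented above, metrics can be read out directly. A hedged example using key names from the docstring:

```python
# Hedged sketch of consuming segmentation evaluation results.
seg_metrics = model.evaluate(eval_dataset, batch_size=1)
print(seg_metrics['miou'])    # mean IoU over categories
print(seg_metrics['kappa'])   # Cohen's kappa
```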
@@ -477,24 +499,27 @@ class BaseSegmenter(BaseModel):
     def predict(self, img_file, transforms=None):
         """
         Do inference.
+
         Args:
-            Args:
-            img_file(list[np.ndarray | str] | str | np.ndarray):
-                Image path or decoded image data, which also could constitute a list,meaning all images to be 
+            img_file (list[np.ndarray|str] | str | np.ndarray): Image path or decoded 
+                image data, or a list of these, in which case all images will be 
                 predicted as a mini-batch.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for 
+                inputs. If None, the transforms for evaluation process will be used. 
+                Defaults to None.
 
         Returns:
-            If img_file is a string or np.array, the result is a dict with key-value pairs:
-            {"label map": `label map`, "score_map": `score map`}.
-            If img_file is a list, the result is a list composed of dicts with the corresponding fields:
-            label_map(np.ndarray): the predicted label map (HW)
-            score_map(np.ndarray): the prediction score map (HWC)
-
+            If `img_file` is a string or np.array, the result is a dict with key-value 
+                pairs:
+                {"label_map": `label map`, "score_map": `score map`}.
+            If `img_file` is a list, the result is a list composed of dicts with the 
+                corresponding fields:
+                label_map (np.ndarray): Predicted label map (HW).
+                score_map (np.ndarray): Prediction score map (HWC).
         """
         """
+
         if transforms is None and not hasattr(self, 'test_transforms'):
-            raise Exception("transforms need to be defined, now is None.")
+            raise ValueError("transforms need to be defined, now is None.")
         if transforms is None:
             transforms = self.test_transforms
         if isinstance(img_file, (str, np.ndarray)):
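
A hedged sketch of the documented return structure in use; 'demo.tif' is a placeholder:

```python
# Hypothetical segmentation inference sketch.
result = model.predict('demo.tif')
label_map = result['label_map']   # (H, W) array of predicted class indices
score_map = result['score_map']   # (H, W, C) array of per-class scores
```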
@@ -528,19 +553,19 @@ class BaseSegmenter(BaseModel):
                        transforms=None):
         """
         Do inference.
+
         Args:
-            Args:
-            img_file(str):
-                Image path.
-            save_dir(str):
-                Directory that contains saved geotiff file.
-            block_size(list[int] | tuple[int] | int):
+            img_file (str): Image path.
+            save_dir (str): Directory that contains saved geotiff file.
+            block_size (list[int] | tuple[int] | int):
                 Size of block.
-            overlap(list[int] | tuple[int] | int, optional):
+            overlap (list[int] | tuple[int] | int, optional):
                 Overlap between two blocks. Defaults to 36.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for 
+                inputs. If None, the transforms for evaluation process will be used. 
+                Defaults to None.
         """
         """
+
         try:
             from osgeo import gdal
         except:
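
A hedged sketch of sliding-window inference over a large raster; the path is a placeholder, and GDAL must be importable for this method to run:

```python
# Hypothetical sliding-window inference sketch for a large GeoTIFF.
model.slide_predict(
    img_file='large_scene.tif',
    save_dir='output/slide',
    block_size=512,   # an int gives square blocks; a pair sets (w, h)
    overlap=36)       # documented default overlap between blocks
```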
@@ -790,7 +815,7 @@ class DeepLabV3P(BaseSegmenter):
         if backbone not in ['ResNet50_vd', 'ResNet101_vd']:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ResNet50_vd', 'ResNet101_vd')".format(backbone))
+                "{'ResNet50_vd', 'ResNet101_vd'}.".format(backbone))
         if params.get('with_net', True):
             with DisablePrint():
                 backbone = getattr(paddleseg.models, backbone)(
@@ -834,8 +859,8 @@ class HRNet(BaseSegmenter):
                  **params):
         if width not in (18, 48):
             raise ValueError(
-                "width={} is not supported, please choose from [18, 48]".format(
-                    width))
+                "width={} is not supported, please choose from {18, 48}.".
+                format(width))
         self.backbone_name = 'HRNet_W{}'.format(width)
         if params.get('with_net', True):
             with DisablePrint():

+ 11 - 18
paddlers/tasks/utils/det_metrics/coco_utils.py

@@ -71,13 +71,13 @@ def cocoapi_eval(anns,
                  classwise=False):
     """
     Args:
-        anns: Evaluation result.
-        style (str): COCOeval style, can be `bbox` , `segm` and `proposal`.
-        coco_gt (str): Whether to load COCOAPI through anno_file,
+        anns (list): Evaluation result.
+        style (str): COCOeval style. Choices are 'bbox', 'segm' and 'proposal'.
+        coco_gt (COCO, optional): A COCO API object constructed from the annotations,
                 eg: coco_gt = COCO(anno_file)
-        anno_file (str): COCO annotations file.
-        max_dets (tuple): COCO evaluation maxDets.
-        classwise (bool): Whether per-category AP and draw P-R Curve or not.
+        anno_file (str, optional): COCO annotations file. Defaults to None.
+        max_dets (tuple, optional): COCO evaluation maxDets. Defaults to (100, 300, 1000).
+        classwise (bool, optional): Whether to calculate per-category statistics or not. Defaults to False.
     """
     """
 
 
     assert coco_gt is not None or anno_file is not None
     assert coco_gt is not None or anno_file is not None
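
For orientation, a hedged sketch of the plain pycocotools calls that this helper wraps; the file names are placeholders:

```python
# Hedged sketch of a pycocotools evaluation round-trip.
from pycocotools.coco import COCO
from pycocotools.cocoeval import COCOeval

coco_gt = COCO('annotations.json')         # ground truth (placeholder path)
coco_dt = coco_gt.loadRes('results.json')  # detections (placeholder path)
coco_eval = COCOeval(coco_gt, coco_dt, iouType='bbox')
coco_eval.params.maxDets = [100, 300, 1000]
coco_eval.evaluate()
coco_eval.accumulate()
coco_eval.summarize()
```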
@@ -148,12 +148,6 @@ def cocoapi_eval(anns,
 
 
 def loadRes(coco_obj, anns):
-    """
-    Load result file and return a result api object.
-    :param   resFile (str)     : file name of result file
-    :return: res (obj)         : result api object
-    """
-
     # This function has the same functionality as pycocotools.COCO.loadRes,
     # This function has the same functionality as pycocotools.COCO.loadRes,
     # except that the input anns is list of results rather than a json file.
     # except that the input anns is list of results rather than a json file.
     # Refer to
     # Refer to
@@ -294,7 +288,6 @@ def analyze_individual_category(k, cocoDt, cocoGt, catId, iou_type, areas=None):
         int:
         int:
         dict: 有关键字'ps_supercategory'和'ps_allcategory'。关键字'ps_supercategory'的键值是忽略亚类间
         dict: 有关键字'ps_supercategory'和'ps_allcategory'。关键字'ps_supercategory'的键值是忽略亚类间
             混淆时的准确率,关键字'ps_allcategory'的键值是忽略类别间混淆时的准确率。
             混淆时的准确率,关键字'ps_allcategory'的键值是忽略类别间混淆时的准确率。
-
     """
     """
 
 
     # matplotlib.use() must be called *before* pylab, matplotlib.pyplot,
     # matplotlib.use() must be called *before* pylab, matplotlib.pyplot,
@@ -402,13 +395,13 @@ def coco_error_analysis(eval_details_file=None,
                 pred_mask = eval_details['mask']
                 pred_mask = eval_details['mask']
             gt = eval_details['gt']
             gt = eval_details['gt']
     if gt is None or pred_bbox is None:
     if gt is None or pred_bbox is None:
-        raise Exception(
-            "gt/pred_bbox/pred_mask is None now, please set right eval_details_file or gt/pred_bbox/pred_mask."
+        raise ValueError(
+            "gt/pred_bbox/pred_mask is None now. Please set right eval_details_file or gt/pred_bbox/pred_mask."
         )
         )
     if pred_bbox is not None and len(pred_bbox) == 0:
     if pred_bbox is not None and len(pred_bbox) == 0:
-        raise Exception("There is no predicted bbox.")
+        raise ValueError("There is no predicted bbox.")
     if pred_mask is not None and len(pred_mask) == 0:
     if pred_mask is not None and len(pred_mask) == 0:
-        raise Exception("There is no predicted mask.")
+        raise ValueError("There is no predicted mask.")
 
 
     def _analyze_results(cocoGt, cocoDt, res_type, out_dir):
     def _analyze_results(cocoGt, cocoDt, res_type, out_dir):
         """
         """
@@ -474,4 +467,4 @@ def coco_error_analysis(eval_details_file=None,
     if pred_mask is not None:
     if pred_mask is not None:
         coco_dt = loadRes(coco_gt, pred_mask)
         coco_dt = loadRes(coco_gt, pred_mask)
         _analyze_results(coco_gt, coco_dt, res_type='segm', out_dir=save_dir)
         _analyze_results(coco_gt, coco_dt, res_type='segm', out_dir=save_dir)
-    logging.info("The analysis figures are saved in {}".format(save_dir))
+    logging.info("The analysis figures are saved in {}.".format(save_dir))

+ 23 - 20
paddlers/tasks/utils/visualize.py

@@ -50,11 +50,12 @@ def visualize_segmentation(image, result, weight=0.6, save_dir='./',
     Convert segment result to color image, and save added image.
     Convert segment result to color image, and save added image.
 
 
     Args:
     Args:
-        image: the path of origin image
-        result: the predict result of image
-        weight: the image weight of visual image, and the result weight is (1 - weight)
-        save_dir: the directory for saving visual image
-        color: the list of a BGR-mode color for each label.
+        image (str): Path of original image.
+        result (dict): Predicted results.
+        weight (float, optional): Weight used to mix the original image with the predicted image.
+            Defaults to 0.6.
+        save_dir (str, optional): Directory for saving visualized image. Defaults to './'.
+        color (list|None, optional): List of BGR values for each label, or None to 
+            use default colors. Defaults to None.
     """
     """
 
 
     label_map = result['label_map'].astype("uint8")
     label_map = result['label_map'].astype("uint8")
@@ -106,14 +107,15 @@ def visualize_segmentation(image, result, weight=0.6, save_dir='./',
 
 
 
 
 def get_color_map_list(num_classes):
 def get_color_map_list(num_classes):
-    """ 
-    Returns the color map for visualizing the segmentation mask, which can support arbitrary number of classes.
+    """
+    Get the color map for visualizing a segmentation mask.
+    This function supports arbitrary number of classes.
 
 
     Args:
     Args:
-        num_classes: Number of classes
+        num_classes (int): Number of classes.
 
 
     Returns:
     Returns:
-        The color map
+        list: Color map.
     """
     """
 
 
     color_map = num_classes * [0, 0, 0]
     color_map = num_classes * [0, 0, 0]
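
To illustrate the flat list returned by get_color_map_list, a small sketch (only numpy is assumed):

    import numpy as np
    from paddlers.tasks.utils.visualize import get_color_map_list

    color_map = get_color_map_list(num_classes=4)  # flat list, 3 values per class
    palette = np.asarray(color_map, dtype='uint8').reshape(-1, 3)
    label_map = np.array([[0, 1], [2, 3]])
    pseudo_color = palette[label_map]  # (2, 2, 3) pseudo-color image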
@@ -130,10 +132,10 @@ def get_color_map_list(num_classes):
     return color_map
     return color_map
 
 
 
 
-# expand an array of boxes by a given scale.
 def expand_boxes(boxes, scale):
 def expand_boxes(boxes, scale):
     """
     """
-        """
+    Expand an array of boxes by a given scale.
+    """
     w_half = (boxes[:, 2] - boxes[:, 0]) * .5
     w_half = (boxes[:, 2] - boxes[:, 0]) * .5
     h_half = (boxes[:, 3] - boxes[:, 1]) * .5
     h_half = (boxes[:, 3] - boxes[:, 1]) * .5
     x_c = (boxes[:, 2] + boxes[:, 0]) * .5
     x_c = (boxes[:, 2] + boxes[:, 0]) * .5
@@ -175,7 +177,7 @@ def draw_bbox_mask(image, results, threshold=0.5, color_map=None):
     else:
     else:
         color_map = np.asarray(color_map)
         color_map = np.asarray(color_map)
         if color_map.shape[0] != len(labels) or color_map.shape[1] != 3:
         if color_map.shape[0] != len(labels) or color_map.shape[1] != 3:
-            raise Exception(
+            raise ValueError(
                 "The shape for color_map is required to be {}x3, but recieved shape is {}x{}.".
                 "The shape for color_map is required to be {}x3, but recieved shape is {}x{}.".
                 format(len(labels), color_map.shape))
                 format(len(labels), color_map.shape))
         if np.max(color_map) > 255 or np.min(color_map) < 0:
         if np.max(color_map) > 255 or np.min(color_map) < 0:
@@ -203,11 +205,11 @@ def draw_bbox_mask(image, results, threshold=0.5, color_map=None):
         ymax = ymin + h
         ymax = ymin + h
 
 
         color = tuple(map(int, color_map[labels.index(cname)]))
         color = tuple(map(int, color_map[labels.index(cname)]))
-        # draw bbox
+        # Draw bbox
         image = cv2.rectangle(image, (xmin, ymin), (xmax, ymax), color,
         image = cv2.rectangle(image, (xmin, ymin), (xmax, ymax), color,
                               linewidth)
                               linewidth)
 
 
-        # draw mask
+        # Draw mask
         if 'mask' in dt:
         if 'mask' in dt:
             mask = dt['mask'] * 255
             mask = dt['mask'] * 255
             image = image.astype('float32')
             image = image.astype('float32')
@@ -230,7 +232,7 @@ def draw_bbox_mask(image, results, threshold=0.5, color_map=None):
                 thickness=1,
                 thickness=1,
                 lineType=cv2.LINE_AA)
                 lineType=cv2.LINE_AA)
 
 
-        # draw label
+        # Draw label
         text_pos = (xmin, ymin)
         text_pos = (xmin, ymin)
         instance_area = w * h
         instance_area = w * h
         if (instance_area < _SMALL_OBJECT_AREA_THRESH or h < 40):
         if (instance_area < _SMALL_OBJECT_AREA_THRESH or h < 40):
@@ -279,13 +281,13 @@ def draw_pr_curve(eval_details_file=None,
                 pred_mask = eval_details['mask']
                 pred_mask = eval_details['mask']
             gt = eval_details['gt']
             gt = eval_details['gt']
     if gt is None or pred_bbox is None:
     if gt is None or pred_bbox is None:
-        raise Exception(
+        raise ValueError(
             "gt/pred_bbox/pred_mask is None now, please set right eval_details_file or gt/pred_bbox/pred_mask."
             "gt/pred_bbox/pred_mask is None now, please set right eval_details_file or gt/pred_bbox/pred_mask."
         )
         )
     if pred_bbox is not None and len(pred_bbox) == 0:
     if pred_bbox is not None and len(pred_bbox) == 0:
-        raise Exception("There is no predicted bbox.")
+        raise ValueError("There is no predicted bbox.")
     if pred_mask is not None and len(pred_mask) == 0:
     if pred_mask is not None and len(pred_mask) == 0:
-        raise Exception("There is no predicted mask.")
+        raise ValueError("There is no predicted mask.")
     import matplotlib
     import matplotlib
     matplotlib.use('Agg')
     matplotlib.use('Agg')
     import matplotlib.pyplot as plt
     import matplotlib.pyplot as plt
@@ -297,7 +299,8 @@ def draw_pr_curve(eval_details_file=None,
 
 
     def _summarize(coco_gt, ap=1, iouThr=None, areaRng='all', maxDets=100):
     def _summarize(coco_gt, ap=1, iouThr=None, areaRng='all', maxDets=100):
         """
         """
-        This function has the same functionality as _summarize() in pycocotools.COCOeval.summarize().
+        This function has the same functionality as _summarize() in 
+            pycocotools.COCOeval.summarize().
 
 
         Refer to
         Refer to
         https://github.com/cocodataset/cocoapi/blob/8c9bcc3cf640524c4c20a9c40e89cb6a2f2fa0e9/PythonAPI/pycocotools/cocoeval.py#L427,
         https://github.com/cocodataset/cocoapi/blob/8c9bcc3cf640524c4c20a9c40e89cb6a2f2fa0e9/PythonAPI/pycocotools/cocoeval.py#L427,
@@ -336,7 +339,7 @@ def draw_pr_curve(eval_details_file=None,
         stats = _summarize(coco_eval, iouThr=iou_thresh)
         stats = _summarize(coco_eval, iouThr=iou_thresh)
         catIds = coco_gt.getCatIds()
         catIds = coco_gt.getCatIds()
         if len(catIds) != coco_eval.eval['precision'].shape[2]:
         if len(catIds) != coco_eval.eval['precision'].shape[2]:
-            raise Exception(
+            raise ValueError(
                 "The category number must be same as the third dimension of precisions."
                 "The category number must be same as the third dimension of precisions."
             )
             )
         x = np.arange(0.0, 1.01, 0.01)
         x = np.arange(0.0, 1.01, 0.01)
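
A usage sketch for draw_pr_curve (paths hypothetical; the keyword arguments are assumed to mirror those of coco_error_analysis above):

    from paddlers.tasks.utils.visualize import draw_pr_curve

    draw_pr_curve(eval_details_file='eval_details.json',
                  iou_thresh=0.5, save_dir='./pr_curves')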

+ 12 - 11
paddlers/tools/yolo_cluster.py

@@ -30,9 +30,9 @@ class BaseAnchorCluster(object):
         Base Anchor Cluster
         Base Anchor Cluster
         
         
         Args:
         Args:
-            num_anchors (int): number of clusters
-            cache (bool): whether using cache
-            cache_path (str): cache directory path
+            num_anchors (int): Number of clusters.
+            cache (bool): Whether to use cache.
+            cache_path (str): Cache directory path.
         """
         """
         super(BaseAnchorCluster, self).__init__()
         super(BaseAnchorCluster, self).__init__()
         self.num_anchors = num_anchors
         self.num_anchors = num_anchors
@@ -99,14 +99,15 @@ class YOLOAnchorCluster(BaseAnchorCluster):
             https://github.com/ultralytics/yolov5/blob/master/utils/autoanchor.py
             https://github.com/ultralytics/yolov5/blob/master/utils/autoanchor.py
 
 
         Args:
         Args:
-            num_anchors (int): number of clusters
-            dataset (DataSet): DataSet instance, VOC or COCO
-            image_size (list or int): [h, w], being an int means image height and image width are the same.
-            cache (bool): whether using cache. Defaults to True.
-            cache_path (str or None, optional): cache directory path. If None, use `data_dir` of dataset. Defaults to None.
-            iters (int, optional): iters of kmeans algorithm. Defaults to 300.
-            gen_iters (int, optional): iters of genetic algorithm. Defaults to 1000.
-            thresh (float, optional): anchor scale threshold. Defaults to 0.25.
+            num_anchors (int): Number of clusters.
+            dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): Dataset instance.
+            image_size (list[int] | int): [h, w] or an int value that corresponds to the shape [image_size, image_size].
+            cache (bool, optional): Whether to use cache. Defaults to True.
+            cache_path (str|None, optional): Path of cache directory. If None, use `dataset.data_dir`. 
+                Defaults to None.
+            iters (int, optional): Iterations of k-means algorithm. Defaults to 300.
+            gen_iters (int, optional): Iterations of genetic algorithm. Defaults to 1000.
+            thresh (float, optional): Anchor scale threshold. Defaults to 0.25.
         """
         """
         self.dataset = dataset
         self.dataset = dataset
         if cache_path is None:
         if cache_path is None:
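
A hedged sketch of anchor clustering (assuming `train_dataset` is an existing VOCDetDataset or COCODetDataset and that the cluster object is callable, as in the PaddleX implementation this module derives from):

    from paddlers.tools import YOLOAnchorCluster

    cluster = YOLOAnchorCluster(
        num_anchors=9, dataset=train_dataset, image_size=608)
    anchors = cluster()  # e.g. [[10, 13], [16, 30], ...]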

+ 10 - 8
paddlers/transforms/__init__.py

@@ -29,14 +29,16 @@ def decode_image(im_path,
     Decode an image.
     Decode an image.
     
     
     Args:
     Args:
-        im_path (str): Path of the image to decode.
-        to_rgb (bool, optional): If True, convert input image(s) from BGR format to RGB format. Defaults to True.
-        to_uint8 (bool, optional): If True, quantize and convert decoded image(s) to uint8 type. Defaults to True.
-        decode_bgr (bool, optional): If True, automatically interpret a non-geo image (e.g. jpeg images) as a BGR image. 
-            Defaults to True.
-        decode_sar (bool, optional): If True, automatically interpret a two-channel geo image (e.g. geotiff images) as a 
-            SAR image, set this argument to True. Defaults to True.
-
+        im_path (str): Path of the image to decode.
+        to_rgb (bool, optional): If True, convert input image(s) from BGR format to 
+            RGB format. Defaults to True.
+        to_uint8 (bool, optional): If True, quantize and convert decoded image(s) to 
+            uint8 type. Defaults to True.
+        decode_bgr (bool, optional): If True, automatically interpret a non-geo 
+            image (e.g. jpeg images) as a BGR image. Defaults to True.
+        decode_sar (bool, optional): If True, automatically interpret a two-channel 
+            geo image (e.g. geotiff images) as a SAR image. Defaults to True.
+    
     Returns:
     Returns:
         np.ndarray: Decoded image.
         np.ndarray: Decoded image.
     """
     """

+ 22 - 17
paddlers/transforms/batch_operators.py

@@ -72,17 +72,18 @@ class BatchCompose(Transform):
 
 
 class BatchRandomResize(Transform):
 class BatchRandomResize(Transform):
     """
     """
-    Resize a batch of input to random sizes.
+    Resize a batch of inputs to random sizes.
 
 
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
 
     Args:
     Args:
-        target_sizes (list[int] | list[list | tuple] | tuple[list | tuple]):
-            Multiple target sizes, each target size is an int or list/tuple of length 2.
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional):
-            Interpolation method of resize. Defaults to 'LINEAR'.
+        target_sizes (list[int] | list[list|tuple] | tuple[list|tuple]):
+            Multiple target sizes, each of which should be an int or list/tuple of length 2.
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
     Raises:
     Raises:
-        TypeError: Invalid type of target_size.
+        TypeError: Invalid type of `target_sizes`.
         ValueError: Invalid interpolation method.
         ValueError: Invalid interpolation method.
 
 
     See Also:
     See Also:
@@ -111,23 +112,27 @@ class BatchRandomResize(Transform):
 
 
 
 
 class BatchRandomResizeByShort(Transform):
 class BatchRandomResizeByShort(Transform):
-    """Resize a batch of input to random sizes with keeping the aspect ratio.
+    """
+    Resize a batch of inputs to random sizes while keeping the aspect ratio.
 
 
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
 
     Args:
     Args:
-        short_sizes (list[int] | tuple[int]): Target sizes of the shorter side of the image(s).
-        max_size (int, optional): The upper bound of longer side of the image(s).
-            If max_size is -1, no upper bound is applied. Defaults to -1.
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional):
-            Interpolation method of resize. Defaults to 'LINEAR'.
+        short_sizes (list[int] | tuple[int]): Target sizes of the shorter side of 
+            the image(s).
+        max_size (int, optional): Upper bound of longer side of the image(s).
+            If `max_size` is -1, no upper bound will be applied. Defaults to -1.
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
 
 
     Raises:
     Raises:
-        TypeError: Invalid type of target_size.
+        TypeError: Invalid type of `short_sizes`.
         ValueError: Invalid interpolation method.
         ValueError: Invalid interpolation method.
 
 
     See Also:
     See Also:
-        RandomResizeByShort: Resize input to random sizes with keeping the aspect ratio.
+        RandomResizeByShort: Resize input to random sizes while keeping the aspect 
+            ratio.
     """
     """
 
 
     def __init__(self, short_sizes, max_size=-1, interp='NEAREST'):
     def __init__(self, short_sizes, max_size=-1, interp='NEAREST'):
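
A construction sketch (batch operators like this are normally attached to a data loader rather than applied by hand; the sizes are illustrative):

    from paddlers.transforms.batch_operators import BatchRandomResizeByShort

    # Each batch gets a shorter side picked at random, longer side capped at 1024.
    batch_tf = BatchRandomResizeByShort(
        short_sizes=[512, 608, 704], max_size=1024, interp='RANDOM')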
@@ -180,7 +185,7 @@ class _BatchPad(Transform):
 class _Gt2YoloTarget(Transform):
 class _Gt2YoloTarget(Transform):
     """
     """
     Generate YOLOv3 targets by ground truth data, this operator is only used in
     Generate YOLOv3 targets by ground truth data, this operator is only used in
-    fine grained YOLOv3 loss mode
+        fine-grained YOLOv3 loss mode.
     """
     """
 
 
     def __init__(self,
     def __init__(self,

+ 80 - 74
paddlers/transforms/functions.py

@@ -58,75 +58,73 @@ def center_crop(im, crop_size=224):
 # region flip
 # region flip
 def img_flip(im, method=0):
 def img_flip(im, method=0):
     """
     """
-    flip image in different ways, this function provides 5 method to filp
-    this function can be applied to 2D or 3D images
+    Flip an image. 
+    This function provides 5 flipping methods and can be applied to 2D or 3D numpy arrays.
 
 
     Args:
     Args:
-        im(array): image array
-        method(int or string): choose the flip method, it must be one of [
-                                0, 1, 2, 3, 4, 'h', 'v', 'hv', 'rt2lb', 'lt2rb', 'dia', 'adia']
-        0 or 'h': flipped in horizontal direction, which is the most frequently used method
-        1 or 'v': flipped in vertical direction
-        2 or 'hv': flipped in both horizontal diction and vertical direction
-        3 or 'rt2lb' or 'dia': flipped around the diagonal,
-                                which also can be thought as changing the RightTop part with LeftBottom part,
-                                so it is called 'rt2lb' as well.
-        4 or 'lt2rb' or 'adia': flipped around the anti-diagonal
-                                    which also can be thought as changing the LeftTop part with RightBottom part,
-                                    so it is called 'lt2rb' as well.
+        im (np.ndarray): Input image.
+        method (int|str): Flipping method. Must be one of [
+                                0, 1, 2, 3, 4, 'h', 'v', 'hv', 'rt2lb', 'lt2rb', 
+                                'dia', 'adia'].
+            0 or 'h': flip the image in horizontal direction, which is the most frequently 
+                used method;
+            1 or 'v': flip the image in vertical direction;
+            2 or 'hv': flip the image in both horizontal and vertical directions;
+            3 or 'rt2lb' or 'dia': flip the image across the diagonal;
+            4 or 'lt2rb' or 'adia': flip the image across the anti-diagonal.
 
 
     Returns:
     Returns:
-        flipped image(array)
+        np.ndarray: Flipped image.
 
 
     Raises:
     Raises:
-        ValueError: Shape of image should 2d, 3d or more.
+        ValueError: Invalid shape of images.
 
 
     Examples:
     Examples:
-        --assume an image is like this:
+        Assume an image is like this:
 
 
         img:
         img:
         / + +
         / + +
         - / *
         - / *
         - * /
         - * /
 
 
-        --we can flip it in following code:
+        We can flip it with following code:
 
 
-        img_h = im_flip(img, 'h')
-        img_v = im_flip(img, 'v')
-        img_vh = im_flip(img, 2)
-        img_rt2lb = im_flip(img, 3)
-        img_lt2rb = im_flip(img, 4)
+        img_h = img_flip(img, 'h')
+        img_v = img_flip(img, 'v')
+        img_vh = img_flip(img, 2)
+        img_rt2lb = img_flip(img, 3)
+        img_lt2rb = img_flip(img, 4)
 
 
-        --we can get flipped image:
+        Then we get the flipped images:
 
 
-        img_h, flipped in horizontal direction
+        img_h, flipped in horizontal direction:
         + + \
         + + \
         * \ -
         * \ -
         \ * -
         \ * -
 
 
-        img_v, flipped in vertical direction
+        img_v, flipped in vertical direction:
         - * \
         - * \
         - \ *
         - \ *
         \ + +
         \ + +
 
 
-        img_vh, flipped in both horizontal diction and vertical direction
+        img_vh, flipped in both horizontal and vertical directions:
         / * -
         / * -
         * / -
         * / -
         + + /
         + + /
 
 
-        img_rt2lb, flipped around the diagonal
+        img_rt2lb, mirrored on the diagonal:
         / | |
         / | |
         + / *
         + / *
         + * /
         + * /
 
 
-        img_lt2rb, flipped around the anti-diagonal
+        img_lt2rb, mirrored on the anti-diagonal:
         / * +
         / * +
         * / +
         * / +
         | | /
         | | /
-
     """
     """
+
     if not len(im.shape) >= 2:
     if not len(im.shape) >= 2:
-        raise ValueError("Shape of image should 2d, 3d or more")
+        raise ValueError("The number of image dimensions is less than 2.")
     if method == 0 or method == 'h':
     if method == 0 or method == 'h':
         return horizontal_flip(im)
         return horizontal_flip(im)
     elif method == 1 or method == 'v':
     elif method == 1 or method == 'v':
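
A concrete numpy counterpart to the ASCII examples above (a sketch; it assumes only the behaviors documented here):

    import numpy as np
    from paddlers.transforms.functions import img_flip

    img = np.arange(9).reshape(3, 3)
    img_h = img_flip(img, 'h')    # equivalent to img[:, ::-1]
    img_v = img_flip(img, 1)      # equivalent to img[::-1, :]
    img_d = img_flip(img, 'dia')  # mirrored across the main diagonal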
@@ -176,61 +174,58 @@ def lt2rb_flip(im):
 # region rotation
 # region rotation
 def img_simple_rotate(im, method=0):
 def img_simple_rotate(im, method=0):
     """
     """
-    rotate image in simple ways, this function provides 3 method to rotate
-    this function can be applied to 2D or 3D images
+    Rotate an image. 
+    This function provides 3 rotating methods and can be applied to 2D or 3D numpy arrays.
 
 
     Args:
     Args:
-        im(array): image array
-        method(int or string): choose the flip method, it must be one of [
+        im (np.ndarray): Input image.
+        method (int|str): Rotating method, which must be one of [
                                 0, 1, 2, 90, 180, 270
                                 0, 1, 2, 90, 180, 270
-                                ]
-        0 or 90 : rotated in 90 degree, clockwise
-        1 or 180: rotated in 180 degree, clockwise
-        2 or 270: rotated in 270 degree, clockwise
+                                ].
+            0 or 90 : rotate the image by 90 degrees, clockwise;
+            1 or 180: rotate the image by 180 degrees, clockwise;
+            2 or 270: rotate the image by 270 degrees, clockwise.
 
 
     Returns:
     Returns:
-        flipped image(array)
-
+        np.ndarray: Rotated image.
 
 
     Raises:
     Raises:
-        ValueError: Shape of image should 2d, 3d or more.
-
+        ValueError: Invalid shape of images.
 
 
     Examples:
     Examples:
-        --assume an image is like this:
+        Assume an image is like this:
 
 
         img:
         img:
         / + +
         / + +
         - / *
         - / *
         - * /
         - * /
 
 
-        --we can rotate it in following code:
+        We can rotate it with following code:
 
 
         img_r90 = img_simple_rotate(img, 90)
         img_r90 = img_simple_rotate(img, 90)
         img_r180 = img_simple_rotate(img, 1)
         img_r180 = img_simple_rotate(img, 1)
         img_r270 = img_simple_rotate(img, 2)
         img_r270 = img_simple_rotate(img, 2)
 
 
-        --we can get rotated image:
+        Then we get the following rotated images:
 
 
-        img_r90, rotated in 90 degree
+        img_r90, rotated by 90°:
         | | \
         | | \
         * \ +
         * \ +
         \ * +
         \ * +
 
 
-        img_r180, rotated in 180 degree
+        img_r180, rotated by 180°:
         / * -
         / * -
         * / -
         * / -
         + + /
         + + /
 
 
-        img_r270, rotated in 270 degree
+        img_r270, rotated by 270°:
         + * \
         + * \
         + \ *
         + \ *
         \ | |
         \ | |
-
-
     """
     """
+
     if not len(im.shape) >= 2:
     if not len(im.shape) >= 2:
-        raise ValueError("Shape of image should 2d, 3d or more")
+        raise ValueError("The number of image dimensions is less than 2.")
     if method == 0 or method == 90:
     if method == 0 or method == 90:
         return rot_90(im)
         return rot_90(im)
     elif method == 1 or method == 180:
     elif method == 1 or method == 180:
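
And similarly for simple rotation (a sketch):

    import numpy as np
    from paddlers.transforms.functions import img_simple_rotate

    img = np.arange(6).reshape(2, 3)
    img_r90 = img_simple_rotate(img, 90)  # clockwise; shape (2, 3) -> (3, 2)
    img_r180 = img_simple_rotate(img, 1)  # 180 degrees; shape preserved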
@@ -396,14 +391,15 @@ def resize_rle(rle, im_h, im_w, im_scale_x, im_scale_y, interp):
 
 
 
 
 def to_uint8(im, is_linear=False):
 def to_uint8(im, is_linear=False):
-    """ Convert raster to uint8.
+    """
+    Convert raster data to uint8 type.
     
     
     Args:
     Args:
-        im (np.ndarray): The image.
+        im (np.ndarray): Input raster image.
         is_linear (bool, optional): Use 2% linear stretch or not. Default is False.
         is_linear (bool, optional): Use 2% linear stretch or not. Default is False.
 
 
     Returns:
     Returns:
-        np.ndarray: Image on uint8.
+        np.ndarray: Image data with uint8 type.
     """
     """
 
 
     # 2% linear stretch
     # 2% linear stretch
@@ -448,16 +444,18 @@ def to_uint8(im, is_linear=False):
 
 
 
 
 def to_intensity(im):
 def to_intensity(im):
-    """ calculate SAR data's intensity diagram.
+    """
+    Calculate the intensity of SAR data.
 
 
     Args:
     Args:
-        im (np.ndarray): The SAR image.
+        im (np.ndarray): SAR image.
 
 
     Returns:
     Returns:
-        np.ndarray: Intensity diagram.
+        np.ndarray: Intensity image.
     """
     """
+
     if len(im.shape) != 2:
     if len(im.shape) != 2:
-        raise ValueError("im's shape must be 2.")
+        raise ValueError("`len(im.shape) must be 2.")
     # If the data type is complex, the image is SAR data.
     # If the data type is complex, the image is SAR data.
     if isinstance(im[0, 0], complex):
     if isinstance(im[0, 0], complex):
         im = abs(im)
         im = abs(im)
@@ -465,15 +463,18 @@ def to_intensity(im):
 
 
 
 
 def select_bands(im, band_list=[1, 2, 3]):
 def select_bands(im, band_list=[1, 2, 3]):
-    """ Select bands.
+    """
+    Select bands of a multi-band image.
 
 
     Args:
     Args:
-        im (np.ndarray): The image.
-        band_list (list, optional): Bands of selected (Start with 1). Defaults to [1, 2, 3].
+        im (np.ndarray): Input image.
+        band_list (list, optional): Bands to select (band index start from 1). 
+            Defaults to [1, 2, 3].
 
 
     Returns:
     Returns:
-        np.ndarray: The image after band selected.
+        np.ndarray: Image with selected bands.
     """
     """
+
     if len(im.shape) == 2:  # just have one channel
     if len(im.shape) == 2:  # just have one channel
         return im
         return im
     if not isinstance(band_list, list) or len(band_list) == 0:
     if not isinstance(band_list, list) or len(band_list) == 0:
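
A sketch of band selection (band indices are 1-based, as noted above):

    import numpy as np
    from paddlers.transforms.functions import select_bands

    im = np.random.rand(64, 64, 4)               # e.g. an R-G-B-NIR image
    rgb = select_bands(im, band_list=[1, 2, 3])  # keep the first three bands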
@@ -492,14 +493,14 @@ def select_bands(im, band_list=[1, 2, 3]):
 
 
 def dehaze(im, gamma=False):
 def dehaze(im, gamma=False):
     """
     """
-    Single image haze removal using dark channel prior.
+    Perform single image haze removal using dark channel prior.
 
 
     Args:
     Args:
         im (np.ndarray): Input image.
         im (np.ndarray): Input image.
         gamma (bool, optional): Use gamma correction or not. Defaults to False.
         gamma (bool, optional): Use gamma correction or not. Defaults to False.
 
 
     Returns:
     Returns:
-        np.ndarray: The image after dehazed.
+        np.ndarray: Output dehazed image.
     """
     """
 
 
     def _guided_filter(I, p, r, eps):
     def _guided_filter(I, p, r, eps):
@@ -549,7 +550,8 @@ def match_histograms(im, ref):
 
 
     Args:
     Args:
         im (np.ndarray): Input image.
         im (np.ndarray): Input image.
-        ref (np.ndarray): Reference image to match histogram of. `ref` must have the same number of channels as `im`.
+        ref (np.ndarray): Reference image to match histogram of. `ref` must have 
+            the same number of channels as `im`.
 
 
     Returns:
     Returns:
         np.ndarray: Transformed input image.
         np.ndarray: Transformed input image.
@@ -557,6 +559,7 @@ def match_histograms(im, ref):
     Raises:
     Raises:
         ValueError: When the number of channels of `ref` differs from that of im`.
         ValueError: When the number of channels of `ref` differs from that of im`.
     """
     """
+
     # TODO: Check the data types of the inputs to see if they are supported by skimage
     # TODO: Check the data types of the inputs to see if they are supported by skimage
     return exposure.match_histograms(
     return exposure.match_histograms(
         im, ref, channel_axis=-1 if im.ndim > 2 else None)
         im, ref, channel_axis=-1 if im.ndim > 2 else None)
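
A sketch of histogram matching (random arrays stand in for real rasters):

    import numpy as np
    from paddlers.transforms.functions import match_histograms

    im = np.random.rand(128, 128, 3)
    ref = np.random.rand(128, 128, 3)  # must have the same number of channels
    matched = match_histograms(im, ref)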
@@ -568,10 +571,12 @@ def match_by_regression(im, ref, pif_loc=None):
 
 
     Args:
     Args:
         im (np.ndarray): Input image.
         im (np.ndarray): Input image.
-        ref (np.ndarray): Reference image to match. `ref` must have the same shape as `im`.
-        pif_loc (tuple|None, optional): Spatial locations where pseudo-invariant features (PIFs) are obtained. If 
-            `pif_loc` is set to None, all pixels in the image will be used as training samples for the regression model. 
-            In other cases, `pif_loc` should be a tuple of np.ndarrays. Default: None.
+        ref (np.ndarray): Reference image to match. `ref` must have the same shape 
+            as `im`.
+        pif_loc (tuple|None, optional): Spatial locations where pseudo-invariant 
+            features (PIFs) are obtained. If `pif_loc` is set to None, all pixels in 
+            the image will be used as training samples for the regression model. In 
+            other cases, `pif_loc` should be a tuple of np.ndarrays. Default: None.
 
 
     Returns:
     Returns:
         np.ndarray: Transformed input image.
         np.ndarray: Transformed input image.
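
A sketch of regression-based matching (the reference is a synthetic linear shift of the input, so the fitted model should roughly invert it):

    import numpy as np
    from paddlers.transforms.functions import match_by_regression

    im = np.random.rand(128, 128, 3)
    ref = 0.8 * im + 0.1                    # synthetic radiometric distortion
    matched = match_by_regression(im, ref)  # pif_loc=None: fit on all pixels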
@@ -609,15 +614,16 @@ def match_by_regression(im, ref, pif_loc=None):
 
 
 def inv_pca(im, joblib_path):
 def inv_pca(im, joblib_path):
     """
     """
-    Restore PCA result.
+    Perform inverse PCA transformation.
 
 
     Args:
     Args:
-        im (np.ndarray): The input image after PCA.
-        joblib_path (str): Path of *.joblib about PCA.
+        im (np.ndarray): Input image after performing PCA.
+        joblib_path (str): Path of *.joblib file that stores PCA information.
 
 
     Returns:
     Returns:
-        np.ndarray: The raw input image.
+        np.ndarray: Reconstructed input image.
     """
     """
+
     pca = load(joblib_path)
     pca = load(joblib_path)
     H, W, C = im.shape
     H, W, C = im.shape
     n_im = np.reshape(im, (-1, C))
     n_im = np.reshape(im, (-1, C))
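
A sketch of restoring a PCA-reduced raster (the *.joblib path is hypothetical and must come from the forward PCA step; `im_pca` is assumed to be its H x W x C output):

    from paddlers.transforms.functions import inv_pca

    restored = inv_pca(im_pca, 'pca_model.joblib')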

+ 155 - 112
paddlers/transforms/operators.py

@@ -123,7 +123,7 @@ class Compose(object):
 
 
 class Transform(object):
 class Transform(object):
     """
     """
-    Parent class of all data augmentation operations
+    Parent class of all data augmentation operators.
     """
     """
 
 
     def __init__(self):
     def __init__(self):
@@ -171,12 +171,15 @@ class DecodeImg(Transform):
     Decode image(s) in input.
     Decode image(s) in input.
     
     
     Args:
     Args:
-        to_rgb (bool, optional): If True, convert input image(s) from BGR format to RGB format. Defaults to True.
-        to_uint8 (bool, optional): If True, quantize and convert decoded image(s) to uint8 type. Defaults to True.
-        decode_bgr (bool, optional): If True, automatically interpret a non-geo image (e.g., jpeg images) as a BGR image. 
-            Defaults to True.
-        decode_sar (bool, optional): If True, automatically interpret a two-channel geo image (e.g. geotiff images) as a 
-            SAR image, set this argument to True. Defaults to True.
+        to_rgb (bool, optional): If True, convert input image(s) from BGR format to 
+            RGB format. Defaults to True.
+        to_uint8 (bool, optional): If True, quantize and convert decoded image(s) to 
+            uint8 type. Defaults to True.
+        decode_bgr (bool, optional): If True, automatically interpret a non-geo image 
+            (e.g., jpeg images) as a BGR image. Defaults to True.
+        decode_sar (bool, optional): If True, automatically interpret a two-channel 
+            geo image (e.g. geotiff images) as a SAR image. Defaults to True.
     """
     """
 
 
     def __init__(self,
     def __init__(self,
@@ -262,7 +265,7 @@ class DecodeImg(Transform):
             sample (dict): Input sample.
             sample (dict): Input sample.
 
 
         Returns:
         Returns:
-            dict: Decoded sample.
+            dict: Sample with decoded images.
         """
         """
 
 
         if 'image' in sample:
         if 'image' in sample:
@@ -299,17 +302,20 @@ class Resize(Transform):
     """
     """
     Resize input.
     Resize input.
 
 
-    - If target_size is an int, resize the image(s) to (target_size, target_size).
-    - If target_size is a list or tuple, resize the image(s) to target_size.
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    - If `target_size` is an int, resize the image(s) to (`target_size`, `target_size`).
+    - If `target_size` is a list or tuple, resize the image(s) to `target_size`.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
 
     Args:
     Args:
-        target_size (int, list[int] | tuple[int]): Target size. If int, the height and width share the same target_size.
-            Otherwise, target_size represents [target height, target width].
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional):
-            Interpolation method of resize. Defaults to 'LINEAR'.
-        keep_ratio (bool): the resize scale of width/height is same and width/height after resized is not greater
-            than target width/height. Defaults to False.
+        target_size (int | list[int] | tuple[int]): Target size. If it is an integer, the
+            target height and width will both be set to `target_size`. Otherwise, 
+            `target_size` represents [target height, target width].
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
+        keep_ratio (bool, optional): If True, the scaling factor of width and height will 
+            be set to the same value, and the height/width of the resized image will not 
+            be greater than the target width/height. Defaults to False.
 
 
     Raises:
     Raises:
         TypeError: Invalid type of target_size.
         TypeError: Invalid type of target_size.
@@ -420,20 +426,18 @@ class RandomResize(Transform):
     """
     """
     Resize input to random sizes.
     Resize input to random sizes.
 
 
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
 
     Args:
     Args:
-        target_sizes (list[int] | list[list | tuple] | tuple[list | tuple]):
-            Multiple target sizes, each target size is an int or list/tuple.
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional):
-            Interpolation method of resize. Defaults to 'LINEAR'.
+        target_sizes (list[int] | list[list|tuple] | tuple[list|tuple]):
+            Multiple target sizes, each of which should be int, list, or tuple.
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
 
 
     Raises:
     Raises:
-        TypeError: Invalid type of target_size.
+        TypeError: Invalid type of `target_sizes`.
         ValueError: Invalid interpolation method.
         ValueError: Invalid interpolation method.
-
-    See Also:
-        Resize input to a specific size.
     """
     """
 
 
     def __init__(self, target_sizes, interp='LINEAR'):
     def __init__(self, target_sizes, interp='LINEAR'):
@@ -459,14 +463,17 @@ class RandomResize(Transform):
 
 
 class ResizeByShort(Transform):
 class ResizeByShort(Transform):
     """
     """
-    Resize input with keeping the aspect ratio.
+    Resize input while keeping the aspect ratio.
 
 
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
 
     Args:
     Args:
         short_size (int): Target size of the shorter side of the image(s).
         short_size (int): Target size of the shorter side of the image(s).
-        max_size (int, optional): The upper bound of longer side of the image(s). If max_size is -1, no upper bound is applied. Defaults to -1.
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional): Interpolation method of resize. Defaults to 'LINEAR'.
+        max_size (int, optional): Upper bound of longer side of the image(s). If
+            `max_size` is -1, no upper bound will be applied. Defaults to -1.
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
 
 
     Raises:
     Raises:
         ValueError: Invalid interpolation method.
         ValueError: Invalid interpolation method.
@@ -498,21 +505,24 @@ class ResizeByShort(Transform):
 
 
 class RandomResizeByShort(Transform):
 class RandomResizeByShort(Transform):
     """
     """
-    Resize input to random sizes with keeping the aspect ratio.
+    Resize input to random sizes while keeping the aspect ratio.
 
 
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
 
     Args:
     Args:
         short_sizes (list[int]): Target sizes of the shorter side of the image(s).
         short_sizes (list[int]): Target sizes of the shorter side of the image(s).
-        max_size (int, optional): The upper bound of longer side of the image(s). If max_size is -1, no upper bound is applied. Defaults to -1.
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional): Interpolation method of resize. Defaults to 'LINEAR'.
+        max_size (int, optional): Upper bound of longer side of the image(s). 
+            If `max_size` is -1, no upper bound will be applied. Defaults to -1.
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
 
 
     Raises:
     Raises:
-        TypeError: Invalid type of target_size.
+        TypeError: Invalid type of `short_sizes`.
         ValueError: Invalid interpolation method.
         ValueError: Invalid interpolation method.
 
 
     See Also:
     See Also:
-        ResizeByShort: Resize image(s) in input with keeping the aspect ratio.
+        ResizeByShort: Resize image(s) in input while keeping the aspect ratio.
     """
     """
 
 
     def __init__(self, short_sizes, max_size=-1, interp='LINEAR'):
     def __init__(self, short_sizes, max_size=-1, interp='LINEAR'):
@@ -555,29 +565,30 @@ class ResizeByLong(Transform):
 
 
 class RandomFlipOrRotate(Transform):
 class RandomFlipOrRotate(Transform):
     """
     """
-    Flip or Rotate an image in different ways with a certain probability.
+    Flip or rotate an image in different directions with a certain probability.
 
 
     Args:
     Args:
-        probs (list of float): Probabilities of flipping and rotation. Default: [0.35,0.25].
-        probsf (list of float): Probabilities of 5 flipping mode
-                                (horizontal, vertical, both horizontal diction and vertical, diagonal, anti-diagonal).
-                                Default: [0.3, 0.3, 0.2, 0.1, 0.1].
-        probsr (list of float): Probabilities of 3 rotation mode(90°, 180°, 270° clockwise). Default: [0.25,0.5,0.25].
+        probs (list[float]): Probabilities of performing flipping and rotation. 
+            Default: [0.35, 0.25].
+        probsf (list[float]): Probabilities of 5 flipping modes (horizontal, 
+            vertical, both horizontal and vertical, diagonal, anti-diagonal). 
+            Default: [0.3, 0.3, 0.2, 0.1, 0.1].
+        probsr (list[float]): Probabilities of 3 rotation modes (90°, 180°, 270° 
+            clockwise). Default: [0.25, 0.5, 0.25].
 
 
     Examples:
     Examples:
 
 
         from paddlers import transforms as T
         from paddlers import transforms as T
 
 
-        # 定义数据增强
+        # Define operators for data augmentation
         train_transforms = T.Compose([
         train_transforms = T.Compose([
             T.DecodeImg(),
             T.DecodeImg(),
             T.RandomFlipOrRotate(
             T.RandomFlipOrRotate(
-                probs  = [0.3, 0.2]             # 进行flip增强的概率是0.3,进行rotate增强的概率是0.2,不变的概率是0.5
-                probsf = [0.3, 0.25, 0, 0, 0]   # flip增强时,使用水平flip、垂直flip的概率分别是0.3、0.25,水平且垂直flip、对角线flip、反对角线flip概率均为0,不变的概率是0.45
-                probsr = [0, 0.65, 0]),         # rotate增强时,顺时针旋转90度的概率是0,顺时针旋转180度的概率是0.65,顺时针旋转90度的概率是0,不变的概率是0.35
-            T.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
+                probs  = [0.3, 0.2],            # p=0.3 to flip the image, p=0.2 to rotate the image, p=0.5 to keep the image unchanged.
+                probsf = [0.3, 0.25, 0, 0, 0],  # p=0.3 and p=0.25 to perform horizontal and vertical flipping; probability of no flipping is 0.45.
+                probsr = [0, 0.65, 0]),         # p=0.65 to rotate the image by 180°; probability of no rotation is 0.35.
+            T.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
         ])
         ])
-
     """
     """
 
 
     def __init__(self,
     def __init__(self,
@@ -615,15 +626,16 @@ class RandomFlipOrRotate(Transform):
         )
         )
 
 
     def get_probs_range(self, probs):
     def get_probs_range(self, probs):
-        '''
-        Change various probabilities into cumulative probabilities
+        """
+        Change list of probabilities into cumulative probability intervals.
 
 
         Args:
         Args:
-            probs(list of float): probabilities of different mode, shape:[n]
+            probs (list[float]): Probabilities of different modes, shape: [n].
 
 
         Returns:
         Returns:
-            probability intervals(list of binary list): shape:[n, 2]
-        '''
+            list[list]: Probability intervals, shape: [n, 2].
+        """
+
         ps = []
         ps = []
         last_prob = 0
         last_prob = 0
         for prob in probs:
         for prob in probs:
@@ -635,17 +647,17 @@ class RandomFlipOrRotate(Transform):
         return ps
         return ps
 
 
     def judge_probs_range(self, p, probs):
     def judge_probs_range(self, p, probs):
-        '''
-        Judge whether a probability value falls within the given probability interval
+        """
+        Judge whether the value of `p` falls within the given probability interval.
 
 
         Args:
         Args:
-            p(float): probability
-            probs(list of binary list): probability intervals, shape:[n, 2]
+            p (float): Value between 0 and 1.
+            probs (list[list]): Probability intervals, shape: [n, 2].
 
 
         Returns:
         Returns:
-            mode id(int):the probability interval number where the input probability falls,
-                         if return -1, the image will remain as it is and will not be processed
-        '''
+            int: Index of the interval that `p` falls into, or -1 if `p` does not 
+                fall into any interval (the image will be kept unchanged).
+        """
+
         for id, id_range in enumerate(probs):
         for id, id_range in enumerate(probs):
             if p > id_range[0] and p < id_range[1]:
             if p > id_range[0] and p < id_range[1]:
                 return id
                 return id
@@ -702,7 +714,7 @@ class RandomHorizontalFlip(Transform):
     Randomly flip the input horizontally.
     Randomly flip the input horizontally.
 
 
     Args:
     Args:
-        prob(float, optional): Probability of flipping the input. Defaults to .5.
+        prob (float, optional): Probability of flipping the input. Defaults to .5.
     """
     """
 
 
     def __init__(self, prob=0.5):
     def __init__(self, prob=0.5):
@@ -760,7 +772,7 @@ class RandomVerticalFlip(Transform):
     Randomly flip the input vertically.
     Randomly flip the input vertically.
 
 
     Args:
     Args:
-        prob(float, optional): Probability of flipping the input. Defaults to .5.
+        prob (float, optional): Probability of flipping the input. Defaults to .5.
     """
     """
 
 
     def __init__(self, prob=0.5):
     def __init__(self, prob=0.5):
@@ -821,10 +833,14 @@ class Normalize(Transform):
     3. im = im / std
     3. im = im / std
 
 
     Args:
     Args:
-        mean(list[float] | tuple[float], optional): Mean of input image(s). Defaults to [0.485, 0.456, 0.406].
-        std(list[float] | tuple[float], optional): Standard deviation of input image(s). Defaults to [0.229, 0.224, 0.225].
-        min_val(list[float] | tuple[float], optional): Minimum value of input image(s). Defaults to [0, 0, 0, ].
-        max_val(list[float] | tuple[float], optional): Max value of input image(s). Defaults to [255., 255., 255.].
+        mean (list[float] | tuple[float], optional): Mean of input image(s). 
+            Defaults to [0.485, 0.456, 0.406].
+        std (list[float] | tuple[float], optional): Standard deviation of input 
+            image(s). Defaults to [0.229, 0.224, 0.225].
+        min_val (list[float] | tuple[float], optional): Minimum value of input 
+            image(s). Defaults to [0, 0, 0, ].
+        max_val (list[float] | tuple[float], optional): Max value of input image(s). 
+            Defaults to [255., 255., 255.].
     """
     """
 
 
     def __init__(self,
     def __init__(self,
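
As a numeric illustration of the normalization steps listed above, applied to a single pixel under the default configuration (plain Python arithmetic):

    x = (127.5 - 0.) / (255. - 0.)  # scale to [0, 1] -> 0.5
    x = x - 0.485                   # subtract the mean -> 0.015
    x = x / 0.229                   # divide by the std -> ~0.0655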
@@ -872,12 +888,13 @@ class Normalize(Transform):
 
 
 class CenterCrop(Transform):
 class CenterCrop(Transform):
     """
     """
-    Crop the input at the center.
+    Crop the input image(s) at the center.
     1. Locate the center of the image.
     1. Locate the center of the image.
-    2. Crop the sample.
+    2. Crop the image.
 
 
     Args:
     Args:
-        crop_size(int, optional): target size of the cropped image(s). Defaults to 224.
+        crop_size (int, optional): Target size of the cropped image(s). 
+            Defaults to 224.
     """
     """
 
 
     def __init__(self, crop_size=224):
     def __init__(self, crop_size=224):
@@ -908,22 +925,27 @@ class CenterCrop(Transform):
 class RandomCrop(Transform):
 class RandomCrop(Transform):
     """
     """
     Randomly crop the input.
     Randomly crop the input.
-    1. Compute the height and width of cropped area according to aspect_ratio and scaling.
+    1. Compute the height and width of cropped area according to `aspect_ratio` and 
+        `scaling`.
     2. Locate the upper left corner of cropped area randomly.
     2. Locate the upper left corner of cropped area randomly.
     3. Crop the image(s).
     3. Crop the image(s).
-    4. Resize the cropped area to crop_size by crop_size.
+    4. Resize the cropped area to `crop_size` x `crop_size`.
 
 
     Args:
     Args:
-        crop_size(int, list[int] | tuple[int]): Target size of the cropped area. If None, the cropped area will not be
-            resized. Defaults to None.
-        aspect_ratio (list[float], optional): Aspect ratio of cropped region in [min, max] format. Defaults to [.5, 2.].
-        thresholds (list[float], optional): Iou thresholds to decide a valid bbox crop.
-            Defaults to [.0, .1, .3, .5, .7, .9].
-        scaling (list[float], optional): Ratio between the cropped region and the original image in [min, max] format.
-            Defaults to [.3, 1.].
-        num_attempts (int, optional): The number of tries before giving up. Defaults to 50.
-        allow_no_crop (bool, optional): Whether returning without doing crop is allowed. Defaults to True.
-        cover_all_box (bool, optional): Whether to ensure all bboxes are covered in the final crop. Defaults to False.
+        crop_size (int | list[int] | tuple[int]): Target size of the cropped area. If 
+            None, the cropped area will not be resized. Defaults to None.
+        aspect_ratio (list[float], optional): Aspect ratio of cropped region in 
+            [min, max] format. Defaults to [.5, 2.].
+        thresholds (list[float], optional): Iou thresholds to decide a valid bbox 
+            crop. Defaults to [.0, .1, .3, .5, .7, .9].
+        scaling (list[float], optional): Ratio between the cropped region and the 
+            original image in [min, max] format. Defaults to [.3, 1.].
+        num_attempts (int, optional): Max number of tries before giving up. 
+            Defaults to 50.
+        allow_no_crop (bool, optional): Whether returning without doing crop is 
+            allowed. Defaults to True.
+        cover_all_box (bool, optional): Whether to ensure all bboxes are covered in 
+            the final crop. Defaults to False.
     """
     """
 
 
     def __init__(self,
     def __init__(self,
@@ -1107,9 +1129,10 @@ class RandomCrop(Transform):
 class RandomScaleAspect(Transform):
 class RandomScaleAspect(Transform):
     """
     """
     Crop input image(s) and resize back to original sizes.
     Crop input image(s) and resize back to original sizes.
+
     Args: 
     Args: 
-        min_scale (float): Minimum ratio between the cropped region and the original image.
-            If 0, image(s) will not be cropped. Defaults to .5.
+        min_scale (float): Minimum ratio between the cropped region and the original
+            image. If 0, image(s) will not be cropped. Defaults to .5.
         aspect_ratio (float): Aspect ratio of cropped region. Defaults to .33.
         aspect_ratio (float): Aspect ratio of cropped region. Defaults to .33.
     """
     """
 
 
@@ -1135,10 +1158,13 @@ class RandomExpand(Transform):
     Randomly expand the input by padding according to random offsets.
     Randomly expand the input by padding according to random offsets.
 
 
     Args:
     Args:
-        upper_ratio(float, optional): The maximum ratio to which the original image is expanded. Defaults to 4..
-        prob(float, optional): The probability of apply expanding. Defaults to .5.
-        im_padding_value(list[float] | tuple[float], optional): RGB filling value for the image. Defaults to (127.5, 127.5, 127.5).
-        label_padding_value(int, optional): Filling value for the mask. Defaults to 255.
+        upper_ratio (float, optional): Maximum ratio to which the original image 
+            is expanded. Defaults to 4.0.
+        prob (float, optional): Probability of applying expansion. Defaults to .5.
+        im_padding_value (list[float] | tuple[float], optional): RGB filling value 
+            for the image. Defaults to (127.5, 127.5, 127.5).
+        label_padding_value (int, optional): Filling value for the mask. 
+            Defaults to 255.
 
 
     See Also:
     See Also:
         paddlers.transforms.Pad
         paddlers.transforms.Pad
@@ -1187,15 +1213,20 @@ class Pad(Transform):
                  label_padding_value=255,
                  label_padding_value=255,
                  size_divisor=32):
                  size_divisor=32):
         """
         """
-        Pad image to a specified size or multiple of size_divisor.
+        Pad image to a specified size or multiple of `size_divisor`.
 
 
         Args:
         Args:
-            target_size(int, Sequence, optional): Image target size, if None, pad to multiple of size_divisor. Defaults to None.
-            pad_mode({-1, 0, 1, 2}, optional): Pad mode, currently only supports four modes [-1, 0, 1, 2]. if -1, use specified offsets
-                if 0, only pad to right and bottom. If 1, pad according to center. If 2, only pad left and top. Defaults to 0.
-            im_padding_value(Sequence[float]): RGB value of pad area. Defaults to (127.5, 127.5, 127.5).
-            label_padding_value(int, optional): Filling value for the mask. Defaults to 255.
-            size_divisor(int): Image width and height after padding is a multiple of coarsest_stride.
+            target_size (list[int] | tuple[int], optional): Image target size. If None, pad to 
+                multiple of `size_divisor`. Defaults to None.
+            pad_mode (int, optional): Pad mode. Currently only four modes are supported:
+                [-1, 0, 1, 2]. If -1, use specified offsets. If 0, only pad to right and bottom.
+                If 1, pad according to center. If 2, only pad left and top. Defaults to 0.
+            im_padding_value (list[float] | tuple[float]): RGB value of padded area. 
+                Defaults to (127.5, 127.5, 127.5).
+            label_padding_value (int, optional): Filling value for the mask. 
+                Defaults to 255.
+            size_divisor (int): Image width and height after padding will be a multiple of 
+                `size_divisor`.
         """
         """
         super(Pad, self).__init__()
         super(Pad, self).__init__()
         if isinstance(target_size, (list, tuple)):
         if isinstance(target_size, (list, tuple)):
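
Two construction sketches for Pad (sizes illustrative):

    from paddlers.transforms import Pad

    pad_fixed = Pad(target_size=[1024, 1024])  # pad every image to 1024 x 1024
    pad_div = Pad(size_divisor=32)             # pad H and W up to multiples of 32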
@@ -1306,8 +1337,10 @@ class MixupImage(Transform):
         Mixup two images and their gt_bbbox/gt_score.
         Mixup two images and their gt_bbbox/gt_score.
 
 
         Args:
         Args:
-            alpha (float, optional): Alpha parameter of beta distribution. Defaults to 1.5.
-            beta (float, optional): Beta parameter of beta distribution. Defaults to 1.5.
+            alpha (float, optional): Alpha parameter of beta distribution. 
+                Defaults to 1.5.
+            beta (float, optional): Beta parameter of beta distribution. 
+                Defaults to 1.5.
         """
         """
         super(MixupImage, self).__init__()
         super(MixupImage, self).__init__()
         if alpha <= 0.0:
         if alpha <= 0.0:
@@ -1385,18 +1418,25 @@ class RandomDistort(Transform):
     Random color distortion.

     Args:
-        brightness_range(float, optional): Range of brightness distortion. Defaults to .5.
-        brightness_prob(float, optional): Probability of brightness distortion. Defaults to .5.
-        contrast_range(float, optional): Range of contrast distortion. Defaults to .5.
-        contrast_prob(float, optional): Probability of contrast distortion. Defaults to .5.
-        saturation_range(float, optional): Range of saturation distortion. Defaults to .5.
-        saturation_prob(float, optional): Probability of saturation distortion. Defaults to .5.
-        hue_range(float, optional): Range of hue distortion. Defaults to .5.
-        hue_prob(float, optional): Probability of hue distortion. Defaults to .5.
-        random_apply (bool, optional): whether to apply in random (yolo) or fixed (SSD)
-            order. Defaults to True.
-        count (int, optional): the number of doing distortion. Defaults to 4.
-        shuffle_channel (bool, optional): whether to swap channels randomly. Defaults to False.
+        brightness_range (float, optional): Range of brightness distortion.
+            Defaults to .5.
+        brightness_prob (float, optional): Probability of brightness distortion.
+            Defaults to .5.
+        contrast_range (float, optional): Range of contrast distortion.
+            Defaults to .5.
+        contrast_prob (float, optional): Probability of contrast distortion.
+            Defaults to .5.
+        saturation_range (float, optional): Range of saturation distortion.
+            Defaults to .5.
+        saturation_prob (float, optional): Probability of saturation distortion.
+            Defaults to .5.
+        hue_range (float, optional): Range of hue distortion. Defaults to .5.
+        hue_prob (float, optional): Probability of hue distortion. Defaults to .5.
+        random_apply (bool, optional): Whether to apply the distortions in random
+            (YOLO) or fixed (SSD) order. Defaults to True.
+        count (int, optional): Number of distortions to apply. Defaults to 4.
+        shuffle_channel (bool, optional): Whether to swap channels randomly.
+            Defaults to False.
    """

    def __init__(self,
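
A hedged configuration sketch for the color distortion transform above (keyword names follow the docstring):

    import paddlers.transforms as T

    # Distort brightness and contrast only, applied in random (YOLO-style) order;
    # saturation and hue are disabled by setting their probabilities to 0.
    distort = T.RandomDistort(
        brightness_range=0.5, brightness_prob=0.5,
        contrast_range=0.5, contrast_prob=0.5,
        saturation_prob=0.0, hue_prob=0.0,
        random_apply=True)
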
@@ -1632,7 +1672,8 @@ class SelectBand(Transform):
     Select a set of bands of input image(s).

     Args:
-        band_list (list, optional): Bands to select (the band index starts with 1). Defaults to [1, 2, 3].
+        band_list (list, optional): Bands to select (band index starts from 1).
+            Defaults to [1, 2, 3].
    """

    def __init__(self, band_list=[1, 2, 3]):
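
For example, extracting a false-color composite from a multispectral image might look like this (the band numbers are illustrative only):

    import paddlers.transforms as T

    # Band indices are 1-based: keep bands 4, 3, and 2.
    select = T.SelectBand(band_list=[4, 3, 2])
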
@@ -1653,11 +1694,12 @@ class SelectBand(Transform):
 class _PadBox(Transform):
     def __init__(self, num_max_boxes=50):
         """
-        Pad zeros to bboxes if number of bboxes is less than num_max_boxes.
+        Pad zeros to bboxes if the number of bboxes is less than `num_max_boxes`.

         Args:
-            num_max_boxes (int, optional): the max number of bboxes. Defaults to 50.
+            num_max_boxes (int, optional): Max number of bboxes. Defaults to 50.
         """
+
         self.num_max_boxes = num_max_boxes
         super(_PadBox, self).__init__()

@@ -1741,7 +1783,8 @@ class RandomSwap(Transform):
     Randomly swap multi-temporal images.

     Args:
-        prob (float, optional): Probability of swapping the input images. Default: 0.2.
+        prob (float, optional): Probability of swapping the input images.
+            Default: 0.2.
    """

    def __init__(self, prob=0.2):
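
A hedged sketch for the swap transform above, which is typically applied to bi-temporal change detection pairs:

    import paddlers.transforms as T

    # Swap the two temporal images of a sample with probability 0.2.
    swap = T.RandomSwap(prob=0.2)
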

+ 5 - 6
paddlers/utils/download.py

@@ -50,8 +50,7 @@ def md5check(fullname, md5sum=None):

 def move_and_merge_tree(src, dst):
     """
-    Move src directory to dst, if dst is already exists,
-    merge src to dst
+    Move `src` to `dst`. If `dst` already exists, merge `src` with `dst`.
     """
     if not osp.exists(dst):
         shutil.move(src, dst)
@@ -71,10 +70,10 @@ def move_and_merge_tree(src, dst):

 def download(url, path, md5sum=None):
     """
-    Download from url, save to path.
+    Download from `url` and save the result to `path`.

-    url (str): download url
-    path (str): download to given path
+    url (str): URL.
+    path (str): Path to save the downloaded result.
     """
     if not osp.exists(path):
         os.makedirs(path)
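
A hedged usage sketch for the helper above; the URL and target directory are placeholders, and the import path assumes the function is exposed by this module:

    from paddlers.utils.download import download  # import path assumed

    # Save the file into ./weights/, creating the directory if it is missing.
    download("https://example.com/model.pdparams", "./weights/")
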
@@ -136,7 +135,7 @@ def download(url, path, md5sum=None):

 def decompress(fname):
     """
-    Decompress for zip and tar file
+    Decompress zip or tar files.
     """
     logging.info("Decompressing {}...".format(fname))


+ 3 - 1
paddlers/utils/env.py

@@ -22,7 +22,9 @@ import paddle


 def get_environ_info():
-    """collect environment information"""
+    """
+    Collect environment information.
+    """

     env_info = dict()
     # TODO is_compiled_with_cuda() has not been moved

+ 2 - 2
paddlers/utils/stats.py

@@ -19,8 +19,8 @@ import numpy as np


 class SmoothedValue(object):
-    """Track a series of values and provide access to smoothed values over a
-    window.
+    """
+    Track a series of values and provide access to smoothed values over a window.
     """

     def __init__(self, window_size=20):
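
The idea behind the class above, sketched independently with collections.deque; this illustrates windowed smoothing only and is not the class's actual API beyond the window_size argument shown:

    from collections import deque

    # Keep the last 20 values and report their running mean.
    window = deque(maxlen=20)
    for loss in (2.0, 1.5, 1.2, 1.1):
        window.append(loss)
    smoothed = sum(window) / len(window)  # 1.45
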

+ 3 - 3
paddlers/utils/utils.py

@@ -53,9 +53,9 @@ def get_single_card_bs(batch_size):
         # Evaluation of detection task only supports single card with batch size 1
         return batch_size
     else:
-        raise Exception("Please support correct batch_size, \
+        raise ValueError("Please specify a correct batch_size, \
                         which can be divided by available cards({}) in {}"
-                        .format(card_num, place))
+                         .format(card_num, place))


 def dict2str(dict_input):
@@ -113,7 +113,7 @@ class EarlyStop:
         self.max = 0
         self.thresh = thresh
         if patience < 1:
-            raise Exception("Argument patience should be a positive integer.")
+            raise ValueError("Argument patience should be a positive integer.")

     def __call__(self, current_score):
         if self.score is None:
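
A hedged driving sketch for EarlyStop; the constructor arguments match the attributes visible above, but the assumption that __call__ returns True once training should stop needs to be verified against the class:

    from paddlers.utils import EarlyStop  # import path assumed

    # Stop once the score fails to improve by `thresh` for `patience` rounds.
    stopper = EarlyStop(patience=5, thresh=1e-4)
    for score in (0.71, 0.72, 0.72, 0.72, 0.72, 0.72, 0.72):
        if stopper(score):  # assumption: True means "stop now"
            break
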

+ 1 - 1
tests/data/data_utils.py

@@ -332,7 +332,7 @@ def build_input_from_file(file_list, prefix='', task='auto', label_list=None):
         prefix (str, optional): A nonempty `prefix` specifies the directory that stores the images and annotation files. Default: ''.
         task (str, optional): Supported values are 'seg', 'det', 'cd', 'clas', and 'auto'. When `task` is set to 'auto', automatically determine the task based on the input.
             Default: 'auto'.
-        label_list (str | None, optional): Path of label_list. Default: None.
+        label_list (str|None, optional): Path of label_list. Default: None.

     Returns:
         list: List of samples.
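
A hedged call sketch for the helper documented above; the file list and prefix are hypothetical:

    from data_utils import build_input_from_file  # module path assumed

    # Each line of train_list.txt is expected to describe one sample; with
    # task='auto' the task type is inferred from the input.
    samples = build_input_from_file(
        "train_list.txt", prefix="./data", task="auto", label_list=None)
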

+ 13 - 13
tests/testing_utils.py

@@ -118,7 +118,7 @@ class _CommonTestNamespace:
                 assertForFloat = self.assertTrue

             result_t = type(result)
-            error_msg = 'Output has diff at place:{}. \nExpect: {} \nBut Got: {} in class {}'
+            error_msg = "Output has diff at place:{}. \nExpect: {} \nBut Got: {} in class {}"
             if result_t in [list, tuple]:
                 result_t = get_container_type(result)
             if result_t in [
@@ -144,8 +144,8 @@ class _CommonTestNamespace:
                             result.shape, self.__class__.__name__))
             else:
                 raise ValueError(
-                    'result type must be str, int, bool, set, np.bool, np.int32, '
-                    'np.int64, np.str, float, np.ndarray, np.float32, np.float64'
+                    "result type must be str, int, bool, set, np.bool, np.int32, "
+                    "np.int64, np.str, float, np.ndarray, np.float32, np.float64"
                 )

         def check_output_equal(self,
@@ -157,13 +157,13 @@ class _CommonTestNamespace:
             Check whether result and expected result are equal, including shape.

             Args:
-                result: str, int, bool, set, np.ndarray.
+                result (str|int|bool|set|np.ndarray):
                     The result needs to be checked.
-                expected_result: str, int, bool, set, np.ndarray. The type has to be same as result's.
-                    Use the expected result to check result.
-                rtol: float
+                expected_result (str|int|bool|set|np.ndarray): The type has to be the
+                    same as result's. Use the expected result to check result.
+                rtol (float, optional):
                     relative tolerance, default 1.e-5.
-                atol: float
+                atol (float, optional):
                     absolute tolerance, default 1.e-8
             """
 
 
@@ -178,13 +178,13 @@ class _CommonTestNamespace:
             Check whether result and expected result are not equal, including shape.

             Args:
-                result: str, int, bool, set, np.ndarray.
+                result (str|int|bool|set|np.ndarray):
                     The result needs to be checked.
-                expected_result: str, int, bool, set, np.ndarray. The type has to be same as result's.
-                    Use the expected result to check result.
-                rtol: float
+                expected_result (str|int|bool|set|np.ndarray): The type has to be the
+                    same as result's. Use the expected result to check result.
+                rtol (float, optional):
                     relative tolerance, default 1.e-5.
-                atol: float
+                atol (float, optional):
                     absolute tolerance, default 1.e-8
             """


+ 3 - 2
tools/coco_tools/json_AnnoSta.py

@@ -11,7 +11,7 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Collect statistics on the annotations in a JSON file and save them as CSV: distributions of object box shape, box shape ratio, box start position, box end position, object category, and per-image object count.
 python ./coco_tools/json_AnnoSta.py \
@@ -24,7 +24,8 @@ python ./coco_tools/json_AnnoSta.py \
     --png_cat_path=./anno_sta/annos_cat.png \
     --png_objNum_path=./anno_sta/annos_objNum.png \
     --get_relative=True
-'''
+"""
+
 import os
 import json
 import argparse

+ 3 - 2
tools/coco_tools/json_Img2Json.py

@@ -11,14 +11,15 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Generate test.json from a folder of test images.
 python ./coco_tools/json_Img2Json.py \
     --test_image_path=./test2017 \
     --json_train_path=./annotations/instances_val2017.json \
     --json_test_path=./test.json
-'''
+"""
+
 import os, cv2
 import json
 import argparse

+ 2 - 2
tools/coco_tools/json_ImgSta.py

@@ -11,7 +11,7 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Collect statistics on the images in a JSON file and save them as CSV, along with 2D distribution plots of image shape and image shape ratio.
 python ./coco_tools/json_ImgSta.py \
@@ -19,7 +19,7 @@ python ./coco_tools/json_ImgSta.py \
     --csv_path=./img_sta/images.csv \
     --png_shape_path=./img_sta/images_shape.png \
     --png_shapeRate_path=./img_sta/images_shapeRate.png
-'''
+"""

 import json
 import argparse

+ 2 - 2
tools/coco_tools/json_InfoShow.py

@@ -11,13 +11,13 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Print basic information about a JSON file.
 python ./coco_tools/json_InfoShow.py \
        --json_path=./annotations/instances_val2017.json \
        --show_num 5
-'''
+"""

 import json
 import argparse

+ 2 - 2
tools/coco_tools/json_Merge.py

@@ -11,14 +11,14 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Merge JSON files. The fields to merge can be controlled via merge_keys; by default the 'images' and 'annotations' fields are merged.
 python ./coco_tools/json_Merge.py \
     --json1_path=./annotations/instances_train2017.json \
     --json2_path=./annotations/instances_val2017.json \
     --save_path=./instances_trainval2017.json
-'''
+"""

 import json
 import argparse

+ 2 - 2
tools/coco_tools/json_Split.py

@@ -11,14 +11,14 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Split a JSON dataset. The split ratio or count can be controlled via val_split_rate and val_split_num; keep_val_inTrain determines whether val-related information is kept in the train split.
 python ./coco_tools/json_Split.py \
     --json_all_path=./annotations/instances_val2017.json \
     --json_train_path=./instances_val2017_train.json \
     --json_val_path=./instances_val2017_val.json
-'''
+"""

 import json
 import argparse

+ 1 - 1
tools/match.py

@@ -22,7 +22,7 @@ from utils import Raster, raster2uint8, save_geotiff, time_it

 class MatchError(Exception):
     def __str__(self):
-        return "Cannot match two images."
+        return "Cannot match the two images."


 def _calcu_tf(im1, im2):

+ 21 - 16
tools/utils/raster.py

@@ -48,21 +48,23 @@ def _get_type(type_name: str) -> int:

 class Raster:
     def __init__(self,
-                 path: Optional[str],
+                 path: str,
                  gdal_obj: Optional[gdal.Dataset]=None,
                  band_list: Union[List[int], Tuple[int], None]=None,
                  to_uint8: bool=False) -> None:
         """
-        Class of raster reader.
+        Reader of raster files.

         Args:
-            path (Optional[str]): Path of raster file.
-            gdal_obj (Optional[Any], optional): GDAL dataset. Defaults to None.
-            band_list (Union[List[int], Tuple[int], None], optional):
-                Select a set of bands (the band index starts from 1) or None (read all bands). Defaults to None.
-            to_uint8 (bool, optional):
-                Whether to convert data type to uint8. Defaults to False.
+            path (str): Path of raster file.
+            gdal_obj (gdal.Dataset|None, optional): GDAL dataset. Defaults to None.
+            band_list (list[int] | tuple[int] | None, optional): Select a set of
+                bands (the band index starts from 1). If None, read all bands.
+                Defaults to None.
+            to_uint8 (bool, optional): Whether to convert data type to uint8.
+                Defaults to False.
         """
+
         super(Raster, self).__init__()
         if path is not None:
             if osp.exists(path):
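
A hedged construction sketch for the reader above; the file name is a placeholder, and the import mirrors the one visible in tools/match.py:

    from utils import Raster  # as imported in tools/match.py

    # Open a GeoTIFF, keep bands 3, 2 and 1 (1-based), and convert to uint8.
    raster = Raster("image.tif", band_list=[3, 2, 1], to_uint8=True)
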
@@ -92,13 +94,15 @@ class Raster:
         self._getType()

     def setBands(self, band_list: Union[List[int], Tuple[int], None]) -> None:
-        """
+        """
         Set bands of data.

         Args:
-            band_list (Union[List[int], Tuple[int], None]):
-                Select a set of bands (the band index starts from 1) or None (read all bands). Defaults to None.
+            band_list (list[int] | tuple[int] | None, optional): Select a set of
+                bands (the band index starts from 1). If None, read all bands.
+                Defaults to None.
         """
+
         if band_list is not None:
             if len(band_list) > self.bands:
                 raise ValueError(
@@ -113,18 +117,19 @@ class Raster:
                  start_loc: Union[List[int], Tuple[int, int], None]=None,
                  block_size: Union[List[int], Tuple[int, int]]=[512, 512]
                  ) -> np.ndarray:
-        """
+        """
         Fetch data in a ndarray.

         Args:
-            start_loc (Union[List[int], Tuple[int], None], optional):
-                Coordinates of the upper left corner of the block. None value means returning full image.
-            block_size (Union[List[int], Tuple[int]], optional):
-                Block size. Defaults to [512, 512].
+            start_loc (list[int] | tuple[int] | None, optional): Coordinates of the
+                upper left corner of the block. If None, return the full image.
+            block_size (list[int] | tuple[int], optional): Block size.
+                Defaults to [512, 512].

         Returns:
             np.ndarray: data's ndarray.
         """
+
         if self._src_data is not None:
             if start_loc is None:
                 return self._getArray()
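
Continuing the sketch above, block reads with getArray might look like this (the file name is a placeholder):

    from utils import Raster  # as imported in tools/match.py

    raster = Raster("image.tif")
    full = raster.getArray()  # start_loc=None returns the full image
    tile = raster.getArray(start_loc=[0, 0], block_size=[512, 512])  # one block
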

+ 2 - 2
tutorials/train/object_detection/faster_rcnn.py

@@ -54,14 +54,14 @@ eval_transforms = T.Compose([
 ])

 # Build the datasets for training and validation, respectively.
-train_dataset = pdrs.datasets.VOCDetection(
+train_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=TRAIN_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,
     transforms=train_transforms,
     shuffle=True)

-eval_dataset = pdrs.datasets.VOCDetection(
+eval_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=EVAL_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,

+ 2 - 2
tutorials/train/object_detection/ppyolo.py

@@ -54,14 +54,14 @@ eval_transforms = T.Compose([
 ])

 # Build the datasets for training and validation, respectively.
-train_dataset = pdrs.datasets.VOCDetection(
+train_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=TRAIN_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,
     transforms=train_transforms,
     shuffle=True)

-eval_dataset = pdrs.datasets.VOCDetection(
+eval_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=EVAL_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,

+ 2 - 2
tutorials/train/object_detection/ppyolotiny.py

@@ -54,14 +54,14 @@ eval_transforms = T.Compose([
 ])

 # Build the datasets for training and validation, respectively.
-train_dataset = pdrs.datasets.VOCDetection(
+train_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=TRAIN_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,
     transforms=train_transforms,
     shuffle=True)

-eval_dataset = pdrs.datasets.VOCDetection(
+eval_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=EVAL_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,

+ 2 - 2
tutorials/train/object_detection/ppyolov2.py

@@ -54,14 +54,14 @@ eval_transforms = T.Compose([
 ])

 # Build the datasets for training and validation, respectively.
-train_dataset = pdrs.datasets.VOCDetection(
+train_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=TRAIN_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,
     transforms=train_transforms,
     shuffle=True)

-eval_dataset = pdrs.datasets.VOCDetection(
+eval_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=EVAL_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,

+ 2 - 2
tutorials/train/object_detection/yolov3.py

@@ -54,14 +54,14 @@ eval_transforms = T.Compose([
 ])

 # Build the datasets for training and validation, respectively.
-train_dataset = pdrs.datasets.VOCDetection(
+train_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=TRAIN_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,
     transforms=train_transforms,
     shuffle=True)

-eval_dataset = pdrs.datasets.VOCDetection(
+eval_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=EVAL_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,