[Doc] Format docs (#9)

Lin Manhui, 2 years ago, commit 64c9697a4d
56 changed files with 1268 additions and 972 deletions
  1. .pre-commit-config.yaml (+4 -4)
  2. paddlers/datasets/__init__.py (+2 -2)
  3. paddlers/datasets/cd_dataset.py (+25 -18)
  4. paddlers/datasets/clas_dataset.py (+13 -11)
  5. paddlers/datasets/coco.py (+35 -30)
  6. paddlers/datasets/seg_dataset.py (+13 -11)
  7. paddlers/datasets/voc.py (+37 -32)
  8. paddlers/deploy/predictor.py (+34 -30)
  9. paddlers/rs_models/cd/backbones/resnet.py (+20 -9)
  10. paddlers/rs_models/cd/bit.py (+9 -9)
  11. paddlers/rs_models/cd/cdnet.py (+15 -25)
  12. paddlers/rs_models/cd/changestar.py (+11 -7)
  13. paddlers/rs_models/cd/dsamnet.py (+10 -7)
  14. paddlers/rs_models/cd/dsifn.py (+6 -5)
  15. paddlers/rs_models/cd/fc_ef.py (+7 -5)
  16. paddlers/rs_models/cd/fc_siam_conc.py (+7 -5)
  17. paddlers/rs_models/cd/fc_siam_diff.py (+7 -5)
  18. paddlers/rs_models/cd/layers/attention.py (+9 -6)
  19. paddlers/rs_models/cd/layers/blocks.py (+3 -1)
  20. paddlers/rs_models/cd/snunet.py (+8 -5)
  21. paddlers/rs_models/cd/stanet.py (+15 -9)
  22. paddlers/rs_models/res/rcan_model.py (+2 -1)
  23. paddlers/rs_models/seg/farseg.py (+5 -4)
  24. paddlers/rs_models/seg/layers/layers_lib.py (+5 -4)
  25. paddlers/tasks/base.py (+25 -20)
  26. paddlers/tasks/change_detector.py (+106 -83)
  27. paddlers/tasks/classifier.py (+84 -59)
  28. paddlers/tasks/load_model.py (+4 -4)
  29. paddlers/tasks/object_detector.py (+268 -168)
  30. paddlers/tasks/segmenter.py (+93 -68)
  31. paddlers/tasks/utils/det_metrics/coco_utils.py (+11 -18)
  32. paddlers/tasks/utils/visualize.py (+23 -20)
  33. paddlers/tools/yolo_cluster.py (+12 -11)
  34. paddlers/transforms/__init__.py (+10 -8)
  35. paddlers/transforms/batch_operators.py (+22 -17)
  36. paddlers/transforms/functions.py (+80 -74)
  37. paddlers/transforms/operators.py (+155 -112)
  38. paddlers/utils/download.py (+5 -6)
  39. paddlers/utils/env.py (+3 -1)
  40. paddlers/utils/stats.py (+2 -2)
  41. paddlers/utils/utils.py (+3 -3)
  42. tests/data/data_utils.py (+1 -1)
  43. tests/testing_utils.py (+13 -13)
  44. tools/coco_tools/json_AnnoSta.py (+3 -2)
  45. tools/coco_tools/json_Img2Json.py (+3 -2)
  46. tools/coco_tools/json_ImgSta.py (+2 -2)
  47. tools/coco_tools/json_InfoShow.py (+2 -2)
  48. tools/coco_tools/json_Merge.py (+2 -2)
  49. tools/coco_tools/json_Split.py (+2 -2)
  50. tools/match.py (+1 -1)
  51. tools/utils/raster.py (+21 -16)
  52. tutorials/train/object_detection/faster_rcnn.py (+2 -2)
  53. tutorials/train/object_detection/ppyolo.py (+2 -2)
  54. tutorials/train/object_detection/ppyolotiny.py (+2 -2)
  55. tutorials/train/object_detection/ppyolov2.py (+2 -2)
  56. tutorials/train/object_detection/yolov3.py (+2 -2)

+ 4 - 4
.pre-commit-config.yaml

@@ -1,11 +1,11 @@
 repos:
 -   repo: https://github.com/PaddlePaddle/mirrors-yapf.git
-    sha: 0d79c0c469bab64f7229c9aca2b1186ef47f0e37
+    rev: 0d79c0c469bab64f7229c9aca2b1186ef47f0e37
     hooks:
     -   id: yapf
         files: \.py$
 -   repo: https://github.com/pre-commit/pre-commit-hooks
-    sha: a11d9314b22d8f8c7556443875b731ef05965464
+    rev: a11d9314b22d8f8c7556443875b731ef05965464
     hooks:
     -   id: check-merge-conflict
     -   id: check-symlinks
@@ -16,7 +16,7 @@ repos:
     -   id: trailing-whitespace
         files: \.md$
 -   repo: https://github.com/Lucas-C/pre-commit-hooks
-    sha: v1.0.1
+    rev: v1.0.1
     hooks:
     -   id: forbid-crlf
         files: \.md$
@@ -25,4 +25,4 @@ repos:
     -   id: forbid-tabs
         files: \.md$
     -   id: remove-tabs
-        files: \.md$
+        files: \.md$

+ 2 - 2
paddlers/datasets/__init__.py

@@ -12,8 +12,8 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-from .voc import VOCDetection
-from .coco import COCODetection
+from .voc import VOCDetDataset
+from .coco import COCODetDataset
 from .seg_dataset import SegDataset
 from .cd_dataset import CDDataset
 from .clas_dataset import ClasDataset

+ 25 - 18
paddlers/datasets/cd_dataset.py

@@ -22,28 +22,33 @@ from paddlers.utils import logging, get_encoding, norm_path, is_pic
 
 class CDDataset(BaseDataset):
     """
-    读取变化检测任务数据集,并对样本进行相应的处理(来自SegDataset,图像标签需要两个)。
+    Dataset for change detection tasks.
 
     Args:
-        data_dir (str): 数据集所在的目录路径。
-        file_list (str): 描述数据集图片文件和对应标注文件的文件路径(文本内每行路径为相对data_dir的相对路径)。当`with_seg_labels`为
-            False(默认设置)时,文件中每一行应依次包含第一时相影像、第二时相影像以及变化检测标签的路径;当`with_seg_labels`为True时,
-            文件中每一行应依次包含第一时相影像、第二时相影像、变化检测标签、第一时相建筑物标签以及第二时相建筑物标签的路径。
-        label_list (str): 描述数据集包含的类别信息文件路径。默认值为None。
-        transforms (paddlers.transforms.Compose): 数据集中每个样本的预处理/增强算子。
-        num_workers (int|str): 数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时,根据
-            系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8,则`num_workers`为8,否则为CPU核数的
-            一半。
-        shuffle (bool): 是否需要对数据集中样本打乱顺序。默认为False。
-        with_seg_labels (bool, optional): 数据集中是否包含两个时相的语义分割标签。默认为False。
-        binarize_labels (bool, optional): 是否对数据集中的标签进行二值化操作。默认为False。
+        data_dir (str): Root directory of the dataset.
+        file_list (str): Path of the file that contains relative paths of images and annotation files. When
+            `with_seg_labels` is False, each line in the file contains the paths of the bi-temporal images and
+            the change mask. When `with_seg_labels` is True, each line in the file contains the paths of the
+            bi-temporal images, the path of the change mask, and the paths of the segmentation masks in both
+            temporal phases.
+        transforms (paddlers.transforms.Compose): Data preprocessing and data augmentation operators to apply.
+        label_list (str, optional): Path of the file that contains the category names. Defaults to None.
+        num_workers (int|str, optional): Number of processes used for data loading. If `num_workers` is 'auto',
+            the number of workers will be automatically determined according to the number of CPU cores: if
+            there are more than 16 cores, 8 workers will be used; otherwise, the number of workers will be half
+            the number of CPU cores. Defaults to 'auto'.
+        shuffle (bool, optional): Whether to shuffle the samples. Defaults to False.
+        with_seg_labels (bool, optional): Set `with_seg_labels` to True if the dataset provides segmentation
+            masks (e.g., building masks in each temporal phase). Defaults to False.
+        binarize_labels (bool, optional): Whether to binarize change masks and segmentation masks. 
+            Defaults to False.
     """
 
     def __init__(self,
                  data_dir,
                  file_list,
+                 transforms,
                  label_list=None,
-                 transforms=None,
                  num_workers='auto',
                  shuffle=False,
                  with_seg_labels=False,
@@ -64,8 +69,7 @@ class CDDataset(BaseDataset):
             num_items = 3  # RGB1, RGB2, CD
         self.binarize_labels = binarize_labels
 
-        # TODO:非None时,让用户跳转数据集分析生成label_list
-        # 不要在此处分析label file
+        # TODO: If `label_list` is not None, let the user parse `label_list`.
         if label_list is not None:
             with open(label_list, encoding=get_encoding(label_list)) as f:
                 for line in f:
@@ -77,7 +81,7 @@ class CDDataset(BaseDataset):
                 items = line.strip().split(DELIMETER)
 
                 if len(items) != num_items:
-                    raise Exception(
+                    raise ValueError(
                         "Line[{}] in file_list[{}] has an incorrect number of file paths.".
                         format(line.strip(), file_list))
 
@@ -148,7 +152,10 @@ class CDDataset(BaseDataset):
 
 
 class MaskType(IntEnum):
-    """Enumeration of the mask types used in the change detection task."""
+    """
+    Enumeration of the mask types used in the change detection task.
+    """
+
     CD = 0
     SEG_T1 = 1
     SEG_T2 = 2
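
A minimal usage sketch under the new signature, where `transforms` is now a required positional argument placed before `label_list` (paths and the transform pipeline are hypothetical):

    from paddlers.datasets import CDDataset
    from paddlers.transforms import Compose, DecodeImg

    # Each line of train_list.txt holds space-separated paths relative to
    # data_dir: first-phase image, second-phase image, change mask.
    train_dataset = CDDataset(
        data_dir='data/levircd',                  # hypothetical dataset root
        file_list='data/levircd/train_list.txt',  # hypothetical file list
        transforms=Compose([DecodeImg()]),        # required positional argument
        label_list=None,
        num_workers='auto',  # half the CPU cores, capped at 8
        shuffle=True,
        with_seg_labels=False,
        binarize_labels=True)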

+ 13 - 11
paddlers/datasets/clas_dataset.py

@@ -19,24 +19,26 @@ from paddlers.utils import logging, get_encoding, norm_path, is_pic
 
 
 class ClasDataset(BaseDataset):
-    """读取图像分类任务数据集,并对样本进行相应的处理。
+    """
+    Dataset for scene classification tasks.
 
     Args:
-        data_dir (str): 数据集所在的目录路径。
-        file_list (str): 描述数据集图片文件和对应标注序号(文本内每行路径为相对data_dir的相对路)。
-        label_list (str): 描述数据集包含的类别信息文件路径,文件格式为(类别 说明)。默认值为None。
-        transforms (paddlers.transforms.Compose): 数据集中每个样本的预处理/增强算子。
-        num_workers (int|str): 数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时,根据
-            系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8,则`num_workers`为8,否则为CPU核数的
-            一半。
-        shuffle (bool): 是否需要对数据集中样本打乱顺序。默认为False。
+        data_dir (str): Root directory of the dataset.
+        file_list (str): Path of the file that contains relative paths of images and labels.
+        transforms (paddlers.transforms.Compose): Data preprocessing and data augmentation operators to apply.
+        label_list (str, optional): Path of the file that contains the category names. Defaults to None.
+        num_workers (int|str, optional): Number of processes used for data loading. If `num_workers` is 'auto',
+            the number of workers will be automatically determined according to the number of CPU cores: if
+            there are more than 16 cores, 8 workers will be used; otherwise, the number of workers will be half
+            the number of CPU cores. Defaults to 'auto'.
+        shuffle (bool, optional): Whether to shuffle the samples. Defaults to False.
     """
 
     def __init__(self,
                  data_dir,
                  file_list,
+                 transforms,
                  label_list=None,
-                 transforms=None,
                  num_workers='auto',
                  shuffle=False):
         super(ClasDataset, self).__init__(data_dir, label_list, transforms,
@@ -57,7 +59,7 @@ class ClasDataset(BaseDataset):
             for line in f:
                 items = line.strip().split()
                 if len(items) > 2:
-                    raise Exception(
+                    raise ValueError(
                         "A space is defined as the delimiter to separate the image and label path, " \
                         "so the space cannot be in the image or label path, but the line[{}] of " \
                         " file_list[{}] has a space in the image or label path.".format(line, file_list))

+ 35 - 30
paddlers/datasets/coco.py

@@ -27,29 +27,32 @@ from paddlers.transforms import DecodeImg, MixupImage
 from paddlers.tools import YOLOAnchorCluster
 
 
-class COCODetection(BaseDataset):
-    """读取COCO格式的检测数据集,并对样本进行相应的处理。
+class COCODetDataset(BaseDataset):
+    """
+    Dataset with COCO annotations for detection tasks.
 
     Args:
-        data_dir (str): 数据集所在的目录路径。
-        image_dir (str): 描述数据集图片文件路径。
-        anno_path (str): COCO标注文件路径。
-        label_list (str): 描述数据集包含的类别信息文件路径。
-        transforms (paddlers.transforms.Compose): 数据集中每个样本的预处理/增强算子。
-        num_workers (int|str): 数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时,根据
-            系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8,则`num_workers`为8,否则为CPU核数的
-            一半。
-        shuffle (bool): 是否需要对数据集中样本打乱顺序。默认为False。
-        allow_empty (bool): 是否加载负样本。默认为False。
-        empty_ratio (float): 用于指定负样本占总样本数的比例。如果小于0或大于等于1,则保留全部的负样本。默认为1。
+        data_dir (str): Root directory of the dataset.
+        image_dir (str): Directory that contains the images.
+        anno_path (str): Path of the COCO annotation file.
+        transforms (paddlers.transforms.Compose): Data preprocessing and data augmentation operators to apply.
+        label_list (str): Path of the file that contains the category names.
+        num_workers (int|str, optional): Number of processes used for data loading. If `num_workers` is 'auto',
+            the number of workers will be automatically determined according to the number of CPU cores: if
+            there are more than 16 cores, 8 workers will be used; otherwise, the number of workers will be half
+            the number of CPU cores. Defaults to 'auto'.
+        shuffle (bool, optional): Whether to shuffle the samples. Defaults to False.
+        allow_empty (bool, optional): Whether to add negative samples. Defaults to False.
+        empty_ratio (float, optional): Ratio of negative samples. If `empty_ratio` is less than 0 or greater
+            than or equal to 1, all generated negative samples are kept. Defaults to 1.0.
     """
 
     def __init__(self,
                  data_dir,
                  image_dir,
                  anno_path,
+                 transforms,
                  label_list,
-                 transforms=None,
                  num_workers='auto',
                  shuffle=False,
                  allow_empty=False,
@@ -60,8 +63,8 @@ class COCODetection(BaseDataset):
         import matplotlib
         matplotlib.use('Agg')
         from pycocotools.coco import COCO
-        super(COCODetection, self).__init__(data_dir, label_list, transforms,
-                                            num_workers, shuffle)
+        super(COCODetDataset, self).__init__(data_dir, label_list, transforms,
+                                             num_workers, shuffle)
 
         self.data_fields = None
         self.num_max_boxes = 50
@@ -281,15 +284,16 @@ class COCODetection(BaseDataset):
             https://github.com/ultralytics/yolov5/blob/master/utils/autoanchor.py
 
         Args:
-            num_anchors (int): number of clusters
-            image_size (list or int): [h, w], being an int means image height and image width are the same.
-            cache (bool): whether using cache
-            cache_path (str or None, optional): cache directory path. If None, use `data_dir` of dataset.
-            iters (int, optional): iters of kmeans algorithm
-            gen_iters (int, optional): iters of genetic algorithm
-            threshold (float, optional): anchor scale threshold
-            verbose (bool, optional): whether print results
+            num_anchors (int): Number of clusters.
+            image_size (list[int]|int): [h, w] or an int value that corresponds to the shape [image_size, image_size].
+            cache (bool, optional): Whether to use cache. Defaults to True.
+            cache_path (str|None, optional): Path of cache directory. If None, use `dataset.data_dir`. 
+                Defaults to None.
+            iters (int, optional): Iterations of k-means algorithm. Defaults to 300.
+            gen_iters (int, optional): Iterations of genetic algorithm. Defaults to 1000.
+            thresh (float, optional): Anchor scale threshold. Defaults to 0.25.
         """
+
         if cache_path is None:
             cache_path = self.data_dir
         cluster = YOLOAnchorCluster(
@@ -305,17 +309,18 @@ class COCODetection(BaseDataset):
         return anchors
 
     def add_negative_samples(self, image_dir, empty_ratio=1):
-        """将背景图片加入训练
+        """
+        Generate and add negative samples.
 
         Args:
-            image_dir (str):背景图片所在的文件夹目录。
-            empty_ratio (float or None): 用于指定负样本占总样本数的比例。如果为None,保留数据集初始化是设置的`empty_ratio`值,
-                否则更新原有`empty_ratio`值。如果小于0或大于等于1,则保留全部的负样本。默认为1。
-
+            image_dir (str): Directory that contains images.
+            empty_ratio (float|None, optional): Ratio of negative samples. If None, keep the value set
+                during dataset construction; otherwise, update it. If `empty_ratio` is less than 0 or
+                greater than or equal to 1, keep all generated negative samples. Defaults to 1.0.
         """
+
         import cv2
         if not osp.isdir(image_dir):
-            raise Exception("{} is not a valid image directory.".format(
+            raise ValueError("{} is not a valid image directory.".format(
                 image_dir))
         if empty_ratio is not None:
             self.empty_ratio = empty_ratio
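
A hedged usage sketch for the renamed class and the negative-sample API (all paths are hypothetical; `anno_path` matches the constructor signature):

    from paddlers.datasets import COCODetDataset
    from paddlers.transforms import Compose, DecodeImg

    train_dataset = COCODetDataset(
        data_dir='data/coco',                          # hypothetical
        image_dir='data/coco/train_images',            # hypothetical
        anno_path='data/coco/annotations/train.json',  # hypothetical
        transforms=Compose([DecodeImg()]),
        label_list='data/coco/labels.txt',             # hypothetical
        allow_empty=True,  # also keep images without objects
        empty_ratio=0.5)   # negatives capped at half of all samples

    # Mix in extra background-only images after construction; passing
    # empty_ratio=None would keep the ratio set above.
    train_dataset.add_negative_samples(
        image_dir='data/coco/backgrounds',  # hypothetical
        empty_ratio=0.25)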

+ 13 - 11
paddlers/datasets/seg_dataset.py

@@ -20,24 +20,26 @@ from paddlers.utils import logging, get_encoding, norm_path, is_pic
 
 
 class SegDataset(BaseDataset):
-    """读取语义分割任务数据集,并对样本进行相应的处理。
+    """
+    Dataset for semantic segmentation tasks.
 
     Args:
-        data_dir (str): 数据集所在的目录路径。
-        file_list (str): 描述数据集图片文件和对应标注文件的文件路径(文本内每行路径为相对data_dir的相对路)。
-        label_list (str): 描述数据集包含的类别信息文件路径。默认值为None。
-        transforms (paddlers.transforms.Compose): 数据集中每个样本的预处理/增强算子。
-        num_workers (int|str): 数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时,根据
-            系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8,则`num_workers`为8,否则为CPU核数的
-            一半。
-        shuffle (bool): 是否需要对数据集中样本打乱顺序。默认为False。
+        data_dir (str): Root directory of the dataset.
+        file_list (str): Path of the file that contains relative paths of images and annotation files.
+        transforms (paddlers.transforms.Compose): Data preprocessing and data augmentation operators to apply.
+        label_list (str, optional): Path of the file that contains the category names. Defaults to None.
+        num_workers (int|str, optional): Number of processes used for data loading. If `num_workers` is 'auto',
+            the number of workers will be automatically determined according to the number of CPU cores: if
+            there are more than 16 cores, 8 workers will be used; otherwise, the number of workers will be half
+            the number of CPU cores. Defaults to 'auto'.
+        shuffle (bool, optional): Whether to shuffle the samples. Defaults to False.
     """
 
     def __init__(self,
                  data_dir,
                  file_list,
+                 transforms,
                  label_list=None,
-                 transforms=None,
                  num_workers='auto',
                  shuffle=False):
         super(SegDataset, self).__init__(data_dir, label_list, transforms,
@@ -58,7 +60,7 @@ class SegDataset(BaseDataset):
             for line in f:
                 items = line.strip().split()
                 if len(items) > 2:
-                    raise Exception(
+                    raise ValueError(
                         "A space is defined as the delimiter to separate the image and label path, " \
                         "so the space cannot be in the image or label path, but the line[{}] of " \
                         " file_list[{}] has a space in the image or label path.".format(line, file_list))

+ 37 - 32
paddlers/datasets/voc.py

@@ -29,27 +29,30 @@ from paddlers.transforms import DecodeImg, MixupImage
 from paddlers.tools import YOLOAnchorCluster
 
 
-class VOCDetection(BaseDataset):
-    """读取PascalVOC格式的检测数据集,并对样本进行相应的处理。
+class VOCDetDataset(BaseDataset):
+    """
+    Dataset with PASCAL VOC annotations for detection tasks.
 
     Args:
-        data_dir (str): 数据集所在的目录路径。
-        file_list (str): 描述数据集图片文件和对应标注文件的文件路径(文本内每行路径为相对data_dir的相对路)。
-        label_list (str): 描述数据集包含的类别信息文件路径。
-        transforms (paddlers.transforms.Compose): 数据集中每个样本的预处理/增强算子。
-        num_workers (int|str): 数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时,根据
-            系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8,则`num_workers`为8,否则为CPU核数的
-            一半。
-        shuffle (bool): 是否需要对数据集中样本打乱顺序。默认为False。
-        allow_empty (bool): 是否加载负样本。默认为False。
-        empty_ratio (float): 用于指定负样本占总样本数的比例。如果小于0或大于等于1,则保留全部的负样本。默认为1。
+        data_dir (str): Root directory of the dataset.
+        file_list (str): Path of the file that contains relative paths of images and annotation files.
+        transforms (paddlers.transforms.Compose): Data preprocessing and data augmentation operators to apply.
+        label_list (str): Path of the file that contains the category names.
+        num_workers (int|str, optional): Number of processes used for data loading. If `num_workers` is 'auto',
+            the number of workers will be automatically determined according to the number of CPU cores: if
+            there are more than 16 cores, 8 workers will be used; otherwise, the number of workers will be half
+            the number of CPU cores. Defaults to 'auto'.
+        shuffle (bool, optional): Whether to shuffle the samples. Defaults to False.
+        allow_empty (bool, optional): Whether to add negative samples. Defaults to False.
+        empty_ratio (float, optional): Ratio of negative samples. If `empty_ratio` is less than 0 or greater
+            than or equal to 1, all generated negative samples are kept. Defaults to 1.0.
     """
 
     def __init__(self,
                  data_dir,
                  file_list,
+                 transforms,
                  label_list,
-                 transforms=None,
                  num_workers='auto',
                  shuffle=False,
                  allow_empty=False,
@@ -60,8 +63,8 @@ class VOCDetection(BaseDataset):
         import matplotlib
         matplotlib.use('Agg')
         from pycocotools.coco import COCO
-        super(VOCDetection, self).__init__(data_dir, label_list, transforms,
-                                           num_workers, shuffle)
+        super(VOCDetDataset, self).__init__(data_dir, label_list, transforms,
+                                            num_workers, shuffle)
 
         self.data_fields = None
         self.num_max_boxes = 50
@@ -109,9 +112,9 @@ class VOCDetection(BaseDataset):
                 if not line:
                     break
                 if len(line.strip().split()) > 2:
-                    raise Exception("A space is defined as the separator, "
-                                    "but it exists in image or label name {}."
-                                    .format(line))
+                    raise ValueError("A space is defined as the separator, "
+                                     "but it exists in image or label name {}."
+                                     .format(line))
                 img_file, xml_file = [
                     osp.join(data_dir, x) for x in line.strip().split()[:2]
                 ]
@@ -345,15 +348,16 @@ class VOCDetection(BaseDataset):
             https://github.com/ultralytics/yolov5/blob/master/utils/autoanchor.py
 
         Args:
-            num_anchors (int): number of clusters
-            image_size (list or int): [h, w], being an int means image height and image width are the same.
-            cache (bool): whether using cache
-            cache_path (str or None, optional): cache directory path. If None, use `data_dir` of dataset.
-            iters (int, optional): iters of kmeans algorithm
-            gen_iters (int, optional): iters of genetic algorithm
-            threshold (float, optional): anchor scale threshold
-            verbose (bool, optional): whether print results
+            num_anchors (int): Number of clusters.
+            image_size (list[int]|int): [h, w] or an int value that corresponds to the shape [image_size, image_size].
+            cache (bool, optional): Whether to use cache. Defaults to True.
+            cache_path (str|None, optional): Path of cache directory. If None, use `dataset.data_dir`. 
+                Defaults to None.
+            iters (int, optional): Iterations of k-means algorithm. Defaults to 300.
+            gen_iters (int, optional): Iterations of genetic algorithm. Defaults to 1000.
+            thresh (float, optional): Anchor scale threshold. Defaults to 0.25.
         """
+
         if cache_path is None:
             cache_path = self.data_dir
         cluster = YOLOAnchorCluster(
@@ -369,17 +373,18 @@ class VOCDetection(BaseDataset):
         return anchors
 
     def add_negative_samples(self, image_dir, empty_ratio=1):
-        """将背景图片加入训练
+        """
+        Generate and add negative samples.
 
         Args:
-            image_dir (str):背景图片所在的文件夹目录。
-            empty_ratio (float or None): 用于指定负样本占总样本数的比例。如果为None,保留数据集初始化是设置的`empty_ratio`值,
-                否则更新原有`empty_ratio`值。如果小于0或大于等于1,则保留全部的负样本。默认为1。
-
+            image_dir (str): Directory that contains images.
+            empty_ratio (float|None, optional): Ratio of negative samples. If None, keep the value set
+                during dataset construction; otherwise, update it. If `empty_ratio` is less than 0 or
+                greater than or equal to 1, keep all generated negative samples. Defaults to 1.0.
         """
+
         import cv2
         if not osp.isdir(image_dir):
-            raise Exception("{} is not a valid image directory.".format(
+            raise ValueError("{} is not a valid image directory.".format(
                 image_dir))
         if empty_ratio is not None:
             self.empty_ratio = empty_ratio
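
A sketch of anchor clustering on the renamed VOC dataset, following the documented defaults (paths are hypothetical):

    from paddlers.datasets import VOCDetDataset
    from paddlers.transforms import Compose, DecodeImg

    train_dataset = VOCDetDataset(
        data_dir='data/voc',                  # hypothetical
        file_list='data/voc/train_list.txt',  # hypothetical
        transforms=Compose([DecodeImg()]),
        label_list='data/voc/labels.txt')     # hypothetical

    # Cluster 9 anchors for 608x608 inputs. Results are cached under
    # dataset.data_dir unless cache_path is given.
    anchors = train_dataset.cluster_yolo_anchor(num_anchors=9, image_size=608)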

+ 34 - 30
paddlers/deploy/predictor.py

@@ -39,20 +39,20 @@ class Predictor(object):
                  max_trt_batch_size=1,
                  trt_precision_mode='float32'):
         """ 
-        创建Paddle Predictor
-
         Args:
-            model_dir: 模型路径(必须是导出的部署或量化模型)。
-            use_gpu: 是否使用GPU,默认为False。
-            gpu_id: 使用GPU的ID,默认为0。
-            cpu_thread_num:使用cpu进行预测时的线程数,默认为1。
-            use_mkl: 是否使用mkldnn计算库,CPU情况下使用,默认为False。
-            mkl_thread_num: mkldnn计算线程数,默认为4。
-            use_trt: 是否使用TensorRT,默认为False。
-            use_glog: 是否启用glog日志, 默认为False。
-            memory_optimize: 是否启动内存优化,默认为True。
-            max_trt_batch_size: 在使用TensorRT时配置的最大batch size,默认为1。
-            trt_precision_mode:在使用TensorRT时采用的精度,可选值['float32', 'float16']。默认为'float32'。
+            model_dir (str): Path of the exported model.
+            use_gpu (bool, optional): Whether to use a GPU. Defaults to False.
+            gpu_id (int, optional): GPU ID. Defaults to 0.
+            cpu_thread_num (int, optional): Number of threads to use when making predictions using CPUs. 
+                Defaults to 1.
+            use_mkl (bool, optional): Whether to use MKL-DNN. Defaults to False.
+            mkl_thread_num (int, optional): Number of MKL threads. Defaults to 4.
+            use_trt (bool, optional): Whether to use TensorRT. Defaults to False.
+            use_glog (bool, optional): Whether to enable glog logs. Defaults to False.
+            memory_optimize (bool, optional): Whether to enable memory optimization. Defaults to True.
+            max_trt_batch_size (int, optional): Maximum batch size when configured with TensorRT. Defaults to 1.
+            trt_precision_mode (str, optional): Precision to use when configured with TensorRT. Possible values 
+                are {'float32', 'float16'}. Defaults to 'float32'.
         """
 
         self.model_dir = model_dir
@@ -209,10 +209,13 @@ class Predictor(object):
         return preds
 
     def raw_predict(self, inputs):
-        """ 接受预处理过后的数据进行预测
-            Args:
-                inputs(dict): 预处理过后的数据
+        """ 
+        Predict according to preprocessed inputs.
+
+        Args:
+            inputs (dict): Preprocessed inputs.
         """
+
         input_names = self.predictor.get_input_names()
         for name in input_names:
             input_tensor = self.predictor.get_input_handle(name)
@@ -253,21 +256,22 @@ class Predictor(object):
                 warmup_iters=0,
                 repeats=1):
         """
-            Do prediction.
-
-            Args:
-                img_file(list[str | tuple | np.ndarray] | str | tuple | np.ndarray): For scene classification, image restoration, 
-                    object detection and semantic segmentation tasks, `img_file` should be either the path of the image to predict
-                    , a decoded image (a np.ndarray, which should be consistent with what you get from passing image path to
-                    paddlers.transforms.decode_image()), or a list of image paths or decoded images. For change detection tasks,
-                    img_file should be a tuple of image paths, a tuple of decoded images, or a list of tuples.
-                topk(int, optional): Top-k values to reserve in a classification result. Defaults to 1.
-                transforms (paddlers.transforms.Compose | None, optional): Pipeline of data preprocessing. If None, load transforms
-                    from `model.yml`. Defaults to None.
-                warmup_iters (int, optional): Warm-up iterations before measuring the execution time. Defaults to 0.
-                repeats (int, optional): Number of repetitions to evaluate model inference and data processing speed. If greater than
-                    1, the reported time consumption is the average of all repeats. Defaults to 1.
+        Do prediction.
+
+        Args:
+            img_file (list[str|tuple|np.ndarray]|str|tuple|np.ndarray): For scene classification, image restoration,
+                object detection, and semantic segmentation tasks, `img_file` should be either the path of the image
+                to predict, a decoded image (a np.ndarray, which should be consistent with what you get from passing
+                the image path to paddlers.transforms.decode_image()), or a list of image paths or decoded images.
+                For change detection tasks, `img_file` should be a tuple of image paths, a tuple of decoded images,
+                or a list of tuples.
+            topk (int, optional): Top-k values to reserve in a classification result. Defaults to 1.
+            transforms (paddlers.transforms.Compose|None, optional): Pipeline of data preprocessing. If None, load transforms
+                from `model.yml`. Defaults to None.
+            warmup_iters (int, optional): Warm-up iterations before measuring the execution time. Defaults to 0.
+            repeats (int, optional): Number of repetitions to evaluate model inference and data processing speed. If greater than
+                1, the reported time consumption is the average of all repeats. Defaults to 1.
         """
+
         if repeats < 1:
             logging.error("`repeats` must be greater than or equal to 1.", exit=True)
         if transforms is None and not hasattr(self._model, 'test_transforms'):
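
A hedged end-to-end sketch of the deployment API described above, assuming `Predictor` is exported from paddlers.deploy (model directory and image paths are hypothetical):

    from paddlers.deploy import Predictor

    predictor = Predictor('output/inference_model', use_gpu=True)

    # For change detection, img_file is a tuple of bi-temporal image paths.
    # The first warmup_iters runs are discarded before timing; repeats > 1
    # averages the reported time over all runs.
    result = predictor.predict(
        img_file=('demo/A.png', 'demo/B.png'),
        warmup_iters=10,
        repeats=50)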

+ 20 - 9
paddlers/rs_models/cd/backbones/resnet.py

@@ -162,14 +162,17 @@ class BottleneckBlock(nn.Layer):
 
 
 class ResNet(nn.Layer):
-    """ResNet model from
-    `"Deep Residual Learning for Image Recognition" <https://arxiv.org/pdf/1512.03385.pdf>`_
+    """
+    ResNet model from "Deep Residual Learning for Image Recognition" 
+        (https://arxiv.org/pdf/1512.03385.pdf)
+    
     Args:
         Block (BasicBlock|BottleneckBlock): Block module of the model.
         depth (int): Number of layers of the ResNet. Default: 50.
-        num_classes (int): output dim of last fc layer. If num_classes <=0, last fc layer 
-                            will not be defined. Default: 1000.
+        num_classes (int): Output dimension of the last fc layer. If num_classes <= 0, the last fc 
+            layer will not be defined. Default: 1000.
         with_pool (bool): Whether to use a pooling layer before the last fc layer. Default: True.
+    
     Examples:
         .. code-block:: python
             from paddle.vision.models import ResNet
@@ -283,7 +286,8 @@ def _resnet(arch, Block, depth, pretrained, **kwargs):
 
 
 def resnet18(pretrained=False, **kwargs):
-    """ResNet 18-layer model
+    """
+    ResNet 18-layer model
     
     Args:
         pretrained (bool): If True, returns a model pre-trained on ImageNet
@@ -299,7 +303,8 @@ def resnet18(pretrained=False, **kwargs):
 
 
 def resnet34(pretrained=False, **kwargs):
-    """ResNet 34-layer model
+    """
+    ResNet 34-layer model
     
     Args:
         pretrained (bool): If True, returns a model pre-trained on ImageNet
@@ -316,10 +321,12 @@ def resnet34(pretrained=False, **kwargs):
 
 
 def resnet50(pretrained=False, **kwargs):
-    """ResNet 50-layer model
+    """
+    ResNet 50-layer model
     
     Args:
         pretrained (bool): If True, returns a model pre-trained on ImageNet
+
     Examples:
         .. code-block:: python
             from paddle.vision.models import resnet50
@@ -332,10 +339,12 @@ def resnet50(pretrained=False, **kwargs):
 
 
 def resnet101(pretrained=False, **kwargs):
-    """ResNet 101-layer model
+    """
+    ResNet 101-layer model
     
     Args:
         pretrained (bool): If True, returns a model pre-trained on ImageNet
+
     Examples:
         .. code-block:: python
             from paddle.vision.models import resnet101
@@ -348,10 +357,12 @@ def resnet101(pretrained=False, **kwargs):
 
 
 def resnet152(pretrained=False, **kwargs):
-    """ResNet 152-layer model
+    """
+    ResNet 152-layer model
     
     Args:
         pretrained (bool): If True, returns a model pre-trained on ImageNet
+        
     Examples:
         .. code-block:: python
             from paddle.vision.models import resnet152

+ 9 - 9
paddlers/rs_models/cd/bit.py

@@ -42,24 +42,24 @@ class BIT(nn.Layer):
     This implementation adopts pretrained encoders, as opposed to the original work where weights are randomly initialized.
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
         backbone (str, optional): The ResNet architecture that is used as the backbone. Currently, only 'resnet18' and 
             'resnet34' are supported. Default: 'resnet18'.
-        n_stages (int, optional): The number of ResNet stages used in the backbone, which should be a value in {3,4,5}. 
+        n_stages (int, optional): Number of ResNet stages used in the backbone, which should be a value in {3,4,5}. 
             Default: 4.
         use_tokenizer (bool, optional): Use a tokenizer or not. Default: True.
-        token_len (int, optional): The length of input tokens. Default: 4.
+        token_len (int, optional): Length of input tokens. Default: 4.
         pool_mode (str, optional): The pooling strategy to obtain input tokens when `use_tokenizer` is set to False. 'max'
             for global max pooling and 'avg' for global average pooling. Default: 'max'.
-        pool_size (int, optional): The height and width of the pooled feature maps when `use_tokenizer` is set to False. 
+        pool_size (int, optional): Height and width of the pooled feature maps when `use_tokenizer` is set to False. 
             Default: 2.
         enc_with_pos (bool, optional): Whether to add learned positional embedding to the input feature sequence of the 
             encoder. Default: True.
-        enc_depth (int, optional): The number of attention blocks used in the encoder. Default: 1
-        enc_head_dim (int, optional): The embedding dimension of each encoder head. Default: 64.
-        dec_depth (int, optional): The number of attention blocks used in the decoder. Default: 8.
-        dec_head_dim (int, optional): The embedding dimension of each decoder head. Default: 8.
+        enc_depth (int, optional): Number of attention blocks used in the encoder. Default: 1.
+        enc_head_dim (int, optional): Embedding dimension of each encoder head. Default: 64.
+        dec_depth (int, optional): Number of attention blocks used in the decoder. Default: 8.
+        dec_head_dim (int, optional): Embedding dimension of each decoder head. Default: 8.
 
     Raises:
         ValueError: When an unsupported backbone type is specified, or the number of backbone stages is not 3, 4, or 5.
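
A minimal construction sketch using the documented arguments, assuming BIT is exported from paddlers.rs_models.cd and, like the other CD networks in this commit, returns a list of prediction tensors:

    import paddle
    from paddlers.rs_models.cd import BIT

    model = BIT(in_channels=3, num_classes=2, backbone='resnet18', n_stages=4)
    t1 = paddle.randn((1, 3, 256, 256))
    t2 = paddle.randn((1, 3, 256, 256))
    logits = model(t1, t2)[0]  # change logits with num_classes channels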

+ 15 - 25
paddlers/rs_models/cd/cdnet.py

@@ -15,8 +15,23 @@
 import paddle
 import paddle.nn as nn
 
+from .layers import Conv7x7
+
 
 class CDNet(nn.Layer):
+    """
+    The CDNet implementation based on PaddlePaddle.
+
+    The original article refers to
+        Pablo F. Alcantarilla, et al., "Street-View Change Detection with 
+        Deconvolutional Networks"
+        (https://link.springer.com/article/10.1007/s10514-018-9734-5).
+
+    Args:
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+    """
+
     def __init__(self, in_channels=6, num_classes=2):
         super(CDNet, self).__init__()
         self.conv1 = Conv7x7(in_channels, 64, norm=True, act=True)
@@ -48,28 +63,3 @@ class CDNet(nn.Layer):
         x = self.conv7(self.upool2(x, ind2))
         x = self.conv8(self.upool1(x, ind1))
         return [self.conv_out(x)]
-
-
-class Conv7x7(nn.Layer):
-    def __init__(self, in_ch, out_ch, norm=False, act=False):
-        super(Conv7x7, self).__init__()
-        layers = [
-            nn.Pad2D(3), nn.Conv2D(
-                in_ch, out_ch, 7, bias_attr=(False if norm else None))
-        ]
-        if norm:
-            layers.append(nn.BatchNorm2D(out_ch))
-        if act:
-            layers.append(nn.ReLU())
-        self.layers = nn.Sequential(*layers)
-
-    def forward(self, x):
-        return self.layers(x)
-
-
-if __name__ == "__main__":
-    t1 = paddle.randn((1, 3, 512, 512), dtype="float32")
-    t2 = paddle.randn((1, 3, 512, 512), dtype="float32")
-    model = CDNet(6, 2)
-    pred = model(t1, t2)[0]
-    print(pred.shape)
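
The removed `__main__` demo still documents the intended usage; it is preserved here as a sketch (assuming CDNet is exported from paddlers.rs_models.cd):

    import paddle
    from paddlers.rs_models.cd import CDNet

    t1 = paddle.randn((1, 3, 512, 512), dtype="float32")
    t2 = paddle.randn((1, 3, 512, 512), dtype="float32")
    # in_channels=6: the two 3-band inputs are concatenated along channels.
    model = CDNet(6, 2)
    pred = model(t1, t2)[0]
    print(pred.shape)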

+ 11 - 7
paddlers/rs_models/cd/changestar.py

@@ -86,7 +86,8 @@ class ChangeStar_FarSeg(_ChangeStarBase):
     The ChangeStar implementation with a FarSeg encoder based on PaddlePaddle.
 
     The original article refers to
-        Z. Zheng, et al., "Change is Everywhere: Single-Temporal Supervised Object Change Detection in Remote Sensing Imagery"
+        Z. Zheng, et al., "Change is Everywhere: Single-Temporal Supervised Object 
+        Change Detection in Remote Sensing Imagery"
         (https://arxiv.org/abs/2108.07002).
     
     Note that this implementation differs from the original code in two aspects:
@@ -94,12 +95,15 @@ class ChangeStar_FarSeg(_ChangeStarBase):
     2. We use conv-bn-relu instead of conv-relu-bn.
 
     Args:
-        num_classes (int): The number of target classes.
-        mid_channels (int, optional): The number of channels required by the ChangeMixin module. Default: 256.
-        inner_channels (int, optional): The number of filters used in the convolutional layers in the ChangeMixin module. 
-            Default: 16.
-        num_convs (int, optional): The number of convolutional layers used in the ChangeMixin module. Default: 4.
-        scale_factor (float, optional): The scaling factor of the output upsampling layer. Default: 4.0.
+        num_classes (int): Number of target classes.
+        mid_channels (int, optional): Number of channels required by the 
+            ChangeMixin module. Default: 256.
+        inner_channels (int, optional): Number of filters used in the 
+            convolutional layers in the ChangeMixin module. Default: 16.
+        num_convs (int, optional): Number of convolutional layers used in the 
+            ChangeMixin module. Default: 4.
+        scale_factor (float, optional): Scaling factor of the output upsampling 
+            layer. Default: 4.0.
     """
 
     def __init__(

+ 10 - 7
paddlers/rs_models/cd/dsamnet.py

@@ -25,19 +25,22 @@ class DSAMNet(nn.Layer):
     The DSAMNet implementation based on PaddlePaddle.
 
     The original article refers to
-        Q. Shi, et al., "A Deeply Supervised Attention Metric-Based Network and an Open Aerial Image Dataset for Remote Sensing 
-        Change Detection"
+        Q. Shi, et al., "A Deeply Supervised Attention Metric-Based Network and an 
+        Open Aerial Image Dataset for Remote Sensing Change Detection"
         (https://ieeexplore.ieee.org/document/9467555).
 
     Note that this implementation differs from the original work in two aspects:
     1. We do not use multiple dilation rates in layer 4 of the ResNet backbone.
-    2. A classification head is used in place of the original metric learning-based head to stablize the training process.
+    2. A classification head is used in place of the original metric learning-based 
+        head to stabilize the training process.
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        ca_ratio (int, optional): The channel reduction ratio for the channel attention module. Default: 8.
-        sa_kernel (int, optional): The size of the convolutional kernel used in the spatial attention module. Default: 7.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        ca_ratio (int, optional): Channel reduction ratio for the channel 
+            attention module. Default: 8.
+        sa_kernel (int, optional): Size of the convolutional kernel used in the 
+            spatial attention module. Default: 7.
     """
 
     def __init__(self, in_channels, num_classes, ca_ratio=8, sa_kernel=7):

+ 6 - 5
paddlers/rs_models/cd/dsifn.py

@@ -28,16 +28,17 @@ class DSIFN(nn.Layer):
     The DSIFN implementation based on PaddlePaddle.
 
     The original article refers to
-        C. Zhang, et al., "A deeply supervised image fusion network for change detection in high resolution bi-temporal remote 
-        sensing images"
+        C. Zhang, et al., "A deeply supervised image fusion network for change 
+        detection in high resolution bi-temporal remote sensing images"
         (https://www.sciencedirect.com/science/article/pii/S0924271620301532).
 
     Note that in this implementation, there is a flexible number of target classes.
 
     Args:
-        num_classes (int): The number of target classes.
-        use_dropout (bool, optional): A bool value that indicates whether to use dropout layers. When the model is trained 
-            on a relatively small dataset, the dropout layers help prevent overfitting. Default: False.
+        num_classes (int): Number of target classes.
+        use_dropout (bool, optional): A bool value that indicates whether to use 
+            dropout layers. When the model is trained on a relatively small dataset, 
+            the dropout layers help prevent overfitting. Default: False.
     """
 
     def __init__(self, num_classes, use_dropout=False):

+ 7 - 5
paddlers/rs_models/cd/fc_ef.py

@@ -26,14 +26,16 @@ class FCEarlyFusion(nn.Layer):
     The FC-EF implementation based on PaddlePaddle.
 
     The original article refers to
-        Caye Daudt, R., et al. "Fully convolutional siamese networks for change detection"
+        Rodrigo Caye Daudt, et al. "Fully convolutional siamese networks for change 
+        detection"
         (https://arxiv.org/abs/1810.08462).
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        use_dropout (bool, optional): A bool value that indicates whether to use dropout layers. When the model is trained 
-            on a relatively small dataset, the dropout layers help prevent overfitting. Default: False.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        use_dropout (bool, optional): A bool value that indicates whether to use 
+            dropout layers. When the model is trained on a relatively small dataset, 
+            the dropout layers help prevent overfitting. Default: False.
     """
 
     def __init__(self, in_channels, num_classes, use_dropout=False):

+ 7 - 5
paddlers/rs_models/cd/fc_siam_conc.py

@@ -26,14 +26,16 @@ class FCSiamConc(nn.Layer):
     The FC-Siam-conc implementation based on PaddlePaddle.
 
     The original article refers to
-        Caye Daudt, R., et al. "Fully convolutional siamese networks for change detection"
+        Rodrigo Caye Daudt, et al. "Fully convolutional siamese networks for change 
+        detection"
         (https://arxiv.org/abs/1810.08462).
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        use_dropout (bool, optional): A bool value that indicates whether to use dropout layers. When the model is trained 
-            on a relatively small dataset, the dropout layers help prevent overfitting. Default: False.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        use_dropout (bool, optional): A bool value that indicates whether to use 
+            dropout layers. When the model is trained on a relatively small dataset, 
+            the dropout layers help prevent overfitting. Default: False.
     """
 
     def __init__(self, in_channels, num_classes, use_dropout=False):

+ 7 - 5
paddlers/rs_models/cd/fc_siam_diff.py

@@ -26,14 +26,16 @@ class FCSiamDiff(nn.Layer):
     The FC-Siam-diff implementation based on PaddlePaddle.
 
     The original article refers to
-        Caye Daudt, R., et al. "Fully convolutional siamese networks for change detection"
+        Rodrigo Caye Daudt, et al. "Fully convolutional siamese networks for change 
+        detection"
         (https://arxiv.org/abs/1810.08462).
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        use_dropout (bool, optional): A bool value that indicates whether to use dropout layers. When the model is trained 
-            on a relatively small dataset, the dropout layers help prevent overfitting. Default: False.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        use_dropout (bool, optional): A bool value that indicates whether to use 
+            dropout layers. When the model is trained on a relatively small dataset, 
+            the dropout layers help prevent overfitting. Default: False.
     """
 
     def __init__(self, in_channels, num_classes, use_dropout=False):

+ 9 - 6
paddlers/rs_models/cd/layers/attention.py

@@ -28,8 +28,8 @@ class ChannelAttention(nn.Layer):
         (https://arxiv.org/abs/1807.06521).
 
     Args:
-        in_ch (int): The number of channels of the input features.
-        ratio (int, optional): The channel reduction ratio. Default: 8.
+        in_ch (int): Number of channels of the input features.
+        ratio (int, optional): Channel reduction ratio. Default: 8.
     """
 
     def __init__(self, in_ch, ratio=8):
@@ -55,7 +55,8 @@ class SpatialAttention(nn.Layer):
         (https://arxiv.org/abs/1807.06521).
 
     Args:
-        kernel_size (int, optional): The size of the convolutional kernel. Default: 7.
+        kernel_size (int, optional): Size of the convolutional kernel. 
+            Default: 7.
     """
 
     def __init__(self, kernel_size=7):
@@ -79,9 +80,11 @@ class CBAM(nn.Layer):
         (https://arxiv.org/abs/1807.06521).
 
     Args:
-        in_ch (int): The number of channels of the input features.
-        ratio (int, optional): The channel reduction ratio for the channel attention module. Default: 8.
-        kernel_size (int, optional): The size of the convolutional kernel used in the spatial attention module. Default: 7.
+        in_ch (int): Number of channels of the input features.
+        ratio (int, optional): Channel reduction ratio for the channel 
+            attention module. Default: 8.
+        kernel_size (int, optional): Size of the convolutional kernel used in 
+            the spatial attention module. Default: 7.
     """
 
     def __init__(self, in_ch, ratio=8, kernel_size=7):
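
A short sketch of the attention layers documented above (import path assumed from the file location):

    import paddle
    from paddlers.rs_models.cd.layers.attention import CBAM

    feats = paddle.randn((1, 64, 32, 32))
    cbam = CBAM(in_ch=64, ratio=8, kernel_size=7)
    refined = cbam(feats)  # channel then spatial attention; shape is preserved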

+ 3 - 1
paddlers/rs_models/cd/layers/blocks.py

@@ -184,7 +184,9 @@ class ConvTransposed3x3(nn.Layer):
 
 
 class Identity(nn.Layer):
-    """A placeholder identity operator that accepts exactly one argument."""
+    """
+    A placeholder identity operator that accepts exactly one argument.
+    """
 
     def __init__(self, *args, **kwargs):
         super(Identity, self).__init__()

+ 8 - 5
paddlers/rs_models/cd/snunet.py

@@ -27,15 +27,18 @@ class SNUNet(nn.Layer, KaimingInitMixin):
     The SNUNet implementation based on PaddlePaddle.
 
     The original article refers to
-        S. Fang, et al., "SNUNet-CD: A Densely Connected Siamese Network for Change Detection of VHR Images"
+        S. Fang, et al., "SNUNet-CD: A Densely Connected Siamese Network for Change 
+        Detection of VHR Images"
         (https://ieeexplore.ieee.org/document/9355573).
 
-    Note that bilinear interpolation is adopted as the upsampling method, which is different from the paper.
+    Note that bilinear interpolation is adopted as the upsampling method, which is 
+        different from the paper.
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        width (int, optional): The output channels of the first convolutional layer. Default: 32.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        width (int, optional): Output channels of the first convolutional layer. 
+            Default: 32.
     """
 
     def __init__(self, in_channels, num_classes, width=32):

+ 15 - 9
paddlers/rs_models/cd/stanet.py

@@ -26,23 +26,29 @@ class STANet(nn.Layer):
     The STANet implementation based on PaddlePaddle.
 
     The original article refers to
-        H. Chen and Z. Shi, "A Spatial-Temporal Attention-Based Method and a New Dataset for Remote Sensing Image Change Detection"
+        H. Chen and Z. Shi, "A Spatial-Temporal Attention-Based Method and a New 
+        Dataset for Remote Sensing Image Change Detection"
         (https://www.mdpi.com/2072-4292/12/10/1662).
 
     Note that this implementation differs from the original work in two aspects:
     1. We do not use multiple dilation rates in layer 4 of the ResNet backbone.
-    2. A classification head is used in place of the original metric learning-based head to stablize the training process.
+    2. A classification head is used in place of the original metric learning-based 
+        head to stabilize the training process.
 
     Args:
-        in_channels (int): The number of bands of the input images.
-        num_classes (int): The number of target classes.
-        att_type (str, optional): The attention module used in the model. Options are 'PAM' and 'BAM'. Default: 'BAM'.
-        ds_factor (int, optional): The downsampling factor of the attention modules. When `ds_factor` is set to values 
-            greater than 1, the input features will first be processed by an average pooling layer with the kernel size of 
-            `ds_factor`, before being used to calculate the attention scores. Default: 1.
+        in_channels (int): Number of bands of the input images.
+        num_classes (int): Number of target classes.
+        att_type (str, optional): The attention module used in the model. Options 
+            are 'PAM' and 'BAM'. Default: 'BAM'.
+        ds_factor (int, optional): Downsampling factor of the attention modules. 
+            When `ds_factor` is set to values greater than 1, the input features 
+            will first be processed by an average pooling layer with the kernel size 
+            of `ds_factor`, before being used to calculate the attention scores. 
+            Default: 1.
 
     Raises:
-        ValueError: When `att_type` has an illeagal value (unsupported attention type).
+        ValueError: When `att_type` has an illegal value (unsupported attention 
+            type).
     """
 
     def __init__(self, in_channels, num_classes, att_type='BAM', ds_factor=1):

+ 2 - 1
paddlers/rs_models/res/rcan_model.py

@@ -25,7 +25,8 @@ from ...models.ppgan.modules.init import reset_parameters
 
 @MODELS.register()
 class RCANModel(BaseModel):
-    """Base SR model for single image super-resolution.
+    """
+    Base SR model for single image super-resolution.
     """
 
     def __init__(self, generator, pixel_criterion=None, use_init_weight=False):

+ 5 - 4
paddlers/rs_models/seg/farseg.py

@@ -32,7 +32,7 @@ class FPN(nn.Layer):
     """
     Module that adds FPN on top of a list of feature maps.
     The feature maps are currently supposed to be in increasing depth
-        order, and must be consecutive
+        order, and must be consecutive.
     """
 
     def __init__(self,
@@ -233,13 +233,14 @@ class ResNet50Encoder(nn.Layer):
 
 
 class FarSeg(nn.Layer):
-    '''
+    """
         The FarSeg implementation based on PaddlePaddle.
 
         The original article refers to
-        Zheng, Zhuo, et al. "Foreground-Aware Relation Network for Geospatial Object Segmentation in High Spatial Resolution Remote Sensing Imagery"
+        Zheng, Zhuo, et al. "Foreground-Aware Relation Network for Geospatial Object 
+            Segmentation in High Spatial Resolution Remote Sensing Imagery"
         (https://openaccess.thecvf.com/content_CVPR_2020/papers/Zheng_Foreground-Aware_Relation_Network_for_Geospatial_Object_Segmentation_in_High_Spatial_CVPR_2020_paper.pdf)
-    '''
+    """
 
     def __init__(self,
                  num_classes=16,

+ 5 - 4
paddlers/rs_models/seg/layers/layers_lib.py

@@ -96,16 +96,17 @@ class Activation(nn.Layer):
     """
     The wrapper of activations.
     Args:
-        act (str, optional): The activation name in lowercase. It must be one of ['elu', 'gelu',
-            'hardshrink', 'tanh', 'hardtanh', 'prelu', 'relu', 'relu6', 'selu', 'leakyrelu', 'sigmoid',
-            'softmax', 'softplus', 'softshrink', 'softsign', 'tanhshrink', 'logsigmoid', 'logsoftmax',
+        act (str, optional): Activation name in lowercase, which must be one of 
+            ['elu', 'gelu', 'hardshrink', 'tanh', 'hardtanh', 'prelu', 'relu', 
+            'relu6', 'selu', 'leakyrelu', 'sigmoid', 'softmax', 'softplus', 
+            'softshrink', 'softsign', 'tanhshrink', 'logsigmoid', 'logsoftmax',
             'hsigmoid']. Default: None, means identical transformation.
     Returns:
         A callable object of Activation.
     Raises:
         KeyError: When parameter `act` is not in the optional range.
     Examples:
-        from paddleseg.models.common.activation import Activation
+        from paddlers.rs_models.seg.layers import Activation
         relu = Activation("relu")
         print(relu)
         # <class 'paddle.nn.layer.activation.ReLU'>

+ 25 - 20
paddlers/tasks/base.py

@@ -126,18 +126,18 @@ class BaseModel(metaclass=ModelMeta):
             if not osp.exists(osp.join(resume_checkpoint, 'model.pdparams')):
                 logging.error(
                     "Model parameter state dictionary file 'model.pdparams' "
-                    "not found under given checkpoint path {}".format(
+                    "was not found in given checkpoint path {}!".format(
                         resume_checkpoint),
                     exit=True)
             if not osp.exists(osp.join(resume_checkpoint, 'model.pdopt')):
                 logging.error(
                     "Optimizer state dictionary file 'model.pdparams' "
-                    "not found under given checkpoint path {}".format(
+                    "was not found in given checkpoint path {}!".format(
                         resume_checkpoint),
                     exit=True)
             if not osp.exists(osp.join(resume_checkpoint, 'model.yml')):
                 logging.error(
-                    "'model.yml' not found under given checkpoint path {}".
+                    "'model.yml' was not found in given checkpoint path {}!".
                     format(resume_checkpoint),
                     exit=True)
             with open(osp.join(resume_checkpoint, "model.yml")) as f:
@@ -264,7 +264,7 @@ class BaseModel(metaclass=ModelMeta):
 
     def build_data_loader(self, dataset, batch_size, mode='train'):
         if dataset.num_samples < batch_size:
-            raise Exception(
+            raise ValueError(
                 'The volume of dataset({}) must be larger than batch size({}).'
                 .format(dataset.num_samples, batch_size))
         batch_size_each_card = get_single_card_bs(batch_size=batch_size)
@@ -478,17 +478,21 @@ class BaseModel(metaclass=ModelMeta):
                             save_dir='output'):
         """
         Args:
-            dataset(paddlers.dataset): Dataset used for evaluation during sensitivity analysis.
-            batch_size(int, optional): Batch size used in evaluation. Defaults to 8.
-            criterion({'l1_norm', 'fpgm'}, optional): Pruning criterion. Defaults to 'l1_norm'.
-            save_dir(str, optional): The directory to save sensitivity file of the model. Defaults to 'output'.
+            dataset (paddlers.datasets.BaseDataset): Dataset used for evaluation during 
+                sensitivity analysis.
+            batch_size (int, optional): Batch size used in evaluation. Defaults to 8.
+            criterion (str, optional): Pruning criterion. Choices are {'l1_norm', 'fpgm'}.
+                Defaults to 'l1_norm'.
+            save_dir (str, optional): Directory to save sensitivity file of the model. 
+                Defaults to 'output'.
         """
+
         if self.__class__.__name__ in {'FasterRCNN', 'MaskRCNN', 'PicoDet'}:
-            raise Exception("{} does not support pruning currently!".format(
+            raise ValueError("{} does not support pruning currently!".format(
                 self.__class__.__name__))
 
         assert criterion in {'l1_norm', 'fpgm'}, \
-            "Pruning criterion {} is not supported. Please choose from ['l1_norm', 'fpgm']"
+            "Pruning criterion {} is not supported. Please choose from {'l1_norm', 'fpgm'}."
         self._check_transforms(dataset.transforms, 'eval')
         if self.model_type == 'detector':
             self.net.eval()
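A hedged call sketch for the sensitivity analysis documented above, assuming the method is named `analyze_sensitivity` and that `model` and `eval_dataset` are built elsewhere:

    model.analyze_sensitivity(
        dataset=eval_dataset,   # paddlers.datasets dataset used for evaluation
        batch_size=8,
        criterion='l1_norm',    # or 'fpgm'
        save_dir='output')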
@@ -515,13 +519,14 @@ class BaseModel(metaclass=ModelMeta):
     def prune(self, pruned_flops, save_dir=None):
         """
         Args:
-            pruned_flops(float): Ratio of FLOPs to be pruned.
-            save_dir(None or str, optional): If None, the pruned model will not be saved.
-                Otherwise, the pruned model will be saved at save_dir. Defaults to None.
+            pruned_flops (float): Ratio of FLOPs to be pruned.
+            save_dir (str|None, optional): If None, the pruned model will not be 
+                saved. Otherwise, the pruned model will be saved at `save_dir`. 
+                Defaults to None.
         """
         if self.status == "Pruned":
-            raise Exception(
-                "A pruned model cannot be done model pruning again!")
+            raise ValueError(
+                "A pruned model cannot be pruned for a second time!")
         pre_pruning_flops = flops(self.net, self.pruner.inputs)
         logging.info("Pre-pruning FLOPs: {}. Pruning starts...".format(
             pre_pruning_flops))
@@ -529,8 +534,8 @@ class BaseModel(metaclass=ModelMeta):
         post_pruning_flops = flops(self.net, self.pruner.inputs)
         logging.info("Pruning is complete. Post-pruning FLOPs: {}".format(
             post_pruning_flops))
-        logging.warning("Pruning the model may hurt its performance, "
-                        "retraining is highly recommended")
+        logging.warning("Pruning the model may hurt its performance. "
+                        "Re-training is highly recommended.")
         self.status = 'Pruned'
 
         if save_dir is not None:
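A correspondingly hedged sketch of the pruning step; per the warning above, the pruned model should be re-trained before use:

    # Prune 30% of FLOPs and save the slimmed model.
    model.prune(pruned_flops=0.3, save_dir='output/pruned')
    # Fine-tune the pruned model afterwards; pruning may hurt performance.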
@@ -540,7 +545,7 @@ class BaseModel(metaclass=ModelMeta):
     def _prepare_qat(self, quant_config):
         if self.status == 'Infer':
             logging.error(
-                "Exported inference model does not support quantization aware training.",
+                "Exported inference model does not support quantization-aware training.",
                 exit=True)
         if quant_config is None:
             # default quantization configuration
@@ -578,7 +583,7 @@ class BaseModel(metaclass=ModelMeta):
         elif quant_config != self.quant_config:
             logging.error(
                 "The model has been quantized with the following quant_config: {}."
-                "Doing quantization-aware training with a quantized model "
+                "Performing quantization-aware training with a quantized model "
                 "using a different configuration is not supported."
                 .format(self.quant_config),
                 exit=True)
@@ -666,7 +671,7 @@ class BaseModel(metaclass=ModelMeta):
 
         # Flag file marking that the model was saved successfully
         open(osp.join(save_dir, '.success'), 'w').close()
-        logging.info("The model for the inference deployment is saved in {}.".
+        logging.info("The inference model for deployment is saved in {}.".
                      format(save_dir))
 
     def _check_transforms(self, transforms, mode):

+ 106 - 83
paddlers/tasks/change_detector.py

@@ -238,29 +238,37 @@ class BaseChangeDetector(BaseModel):
               resume_checkpoint=None):
         """
         Train the model.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to None.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.CDDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.CDDataset|None, optional): Evaluation dataset. 
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. Defaults to None.
+            learning_rate (float, optional): Learning rate for training. Defaults to .01.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. Defaults 
+                to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
+
         if self.status == 'Infer':
             logging.error(
                 "Exported inference model does not support training.",
@@ -336,28 +344,37 @@ class BaseChangeDetector(BaseModel):
                           quant_config=None):
         """
         Quantization-aware training.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            quant_config(dict or None, optional): Quantization configuration. If None, a default rule of thumb
-                configuration will be used. Defaults to None.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume quantization-aware training
-                from. If None, no training checkpoint will be resumed. Defaults to None.
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.CDDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.CDDataset, optional): Evaluation dataset. 
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            learning_rate (float, optional): Learning rate for training. 
+                Defaults to .0001.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            quant_config (dict|None, optional): Quantization configuration. If None, 
+                a default rule of thumb configuration will be used. Defaults to None.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                quantization-aware training from. If None, no training checkpoint will
+                be resumed. Defaults to None.
         """
+
         self._prepare_qat(quant_config)
         self.train(
             num_epochs=num_epochs,
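Assuming the method shown here is exposed as `quant_aware_train` (its name is not visible in this hunk), a hedged sketch; `quant_config=None` selects the default rule-of-thumb configuration:

    model.quant_aware_train(
        num_epochs=5,
        train_dataset=train_data,
        eval_dataset=val_data,
        quant_config=None,       # None -> default quantization configuration
        save_dir='output/quant')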
@@ -379,27 +396,32 @@ class BaseChangeDetector(BaseModel):
     def evaluate(self, eval_dataset, batch_size=1, return_details=False):
         """
         Evaluate the model.
+
         Args:
-            eval_dataset(paddlers.dataset): Evaluation dataset.
-            batch_size(int, optional): Total batch size among all cards used for evaluation. Defaults to 1.
-            return_details(bool, optional): Whether to return evaluation details. Defaults to False.
+            eval_dataset (paddlers.datasets.CDDataset): Evaluation dataset.
+            batch_size (int, optional): Total batch size among all cards used for 
+                evaluation. Defaults to 1.
+            return_details (bool, optional): Whether to return evaluation details. 
+                Defaults to False.
 
         Returns:
             collections.OrderedDict with key-value pairs:
-                For binary change detection (number of classes == 2), the key-value pairs are like:
-                {"iou": `intersection over union for the change class`,
-                 "f1": `F1 score for the change class`,
-                 "oacc": `overall accuracy`,
-                 "kappa": ` kappa coefficient`}.
-                For multi-class change detection (number of classes > 2), the key-value pairs are like:
-                {"miou": `mean intersection over union`,
-                 "category_iou": `category-wise mean intersection over union`,
-                 "oacc": `overall accuracy`,
-                 "category_acc": `category-wise accuracy`,
-                 "kappa": ` kappa coefficient`,
-                 "category_F1-score": `F1 score`}.
-
+                For binary change detection (number of classes == 2), the key-value 
+                    pairs are like:
+                    {"iou": `intersection over union for the change class`,
+                    "f1": `F1 score for the change class`,
+                    "oacc": `overall accuracy`,
+                    "kappa": ` kappa coefficient`}.
+                For multi-class change detection (number of classes > 2), the key-value 
+                    pairs are like:
+                    {"miou": `mean intersection over union`,
+                    "category_iou": `category-wise mean intersection over union`,
+                    "oacc": `overall accuracy`,
+                    "category_acc": `category-wise accuracy`,
+                    "kappa": ` kappa coefficient`,
+                    "category_F1-score": `F1 score`}.
         """
+
         self._check_transforms(eval_dataset.transforms, 'eval')
 
         self.net.eval()
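A hedged evaluation sketch; the metric keys follow the Returns section above:

    metrics = model.evaluate(val_data, batch_size=1)
    # Binary change detection exposes 'iou', 'f1', 'oacc', and 'kappa'.
    print(metrics['iou'], metrics['f1'])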
@@ -500,24 +522,27 @@ class BaseChangeDetector(BaseModel):
     def predict(self, img_file, transforms=None):
         """
         Do inference.
+
         Args:
-            Args:
-            img_file (list[tuple] | tuple[str | np.ndarray]):
-                Tuple of image paths or decoded image data for bi-temporal images, which also could constitute a list,
-                meaning all image pairs to be predicted as a mini-batch.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            img_file (list[tuple] | tuple[str|np.ndarray]): Tuple of image paths or 
+                decoded image data for bi-temporal images, which also could constitute
+                a list, meaning all image pairs to be predicted as a mini-batch.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for 
+                inputs. If None, the transforms for evaluation process will be used. 
+                Defaults to None.
 
         Returns:
-            If img_file is a tuple of string or np.array, the result is a dict with key-value pairs:
-            {"label map": `label map`, "score_map": `score map`}.
-            If img_file is a list, the result is a list composed of dicts with the corresponding fields:
-            label_map(np.ndarray): the predicted label map (HW)
-            score_map(np.ndarray): the prediction score map (HWC)
-
+            If `img_file` is a tuple of string or np.array, the result is a dict with 
+                key-value pairs:
+                {"label_map": `label map`, "score_map": `score map`}.
+            If `img_file` is a list, the result is a list composed of dicts with the 
+                corresponding fields:
+                label_map (np.ndarray): The predicted label map (HW).
+                score_map (np.ndarray): The prediction score map (HWC).
         """
+
         if transforms is None and not hasattr(self, 'test_transforms'):
-            raise Exception("transforms need to be defined, now is None.")
+            raise ValueError("transforms need to be defined, now is None.")
         if transforms is None:
             transforms = self.test_transforms
         if isinstance(img_file, tuple):
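A hedged inference sketch; bi-temporal inputs are passed as a tuple, and the file names are placeholders:

    result = model.predict(('T1/img1.png', 'T2/img1.png'))
    label_map = result['label_map']  # (H, W) predicted labels
    score_map = result['score_map']  # (H, W, C) prediction scores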
@@ -555,26 +580,24 @@ class BaseChangeDetector(BaseModel):
                        transforms=None):
         """
         Do inference.
+
         Args:
-            Args:
-            img_file(list[str]):
-                List of image paths.
-            save_dir(str):
-                Directory that contains saved geotiff file.
-            block_size(list[int] | tuple[int] | int, optional):
-                Size of block.
-            overlap(list[int] | tuple[int] | int, optional):
-                Overlap between two blocks. Defaults to 36.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            img_file (tuple[str]): Tuple of image paths.
+            save_dir (str): Directory that contains saved geotiff file.
+            block_size (list[int] | tuple[int] | int, optional): Size of block.
+            overlap (list[int] | tuple[int] | int, optional): Overlap between two blocks. 
+                Defaults to 36.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for inputs.
+                If None, the transforms for evaluation process will be used. Defaults to None.
         """
+
         try:
             from osgeo import gdal
         except:
             import gdal
 
-        if len(img_file) != 2:
-            raise ValueError("`img_file` must be a list of length 2.")
+        if not isinstance(img_file, tuple) or len(img_file) != 2:
+            raise ValueError("`img_file` must be a tuple of length 2.")
         if isinstance(block_size, int):
             block_size = (block_size, block_size)
         elif isinstance(block_size, (tuple, list)) and len(block_size) == 2:

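For large rasters, a hedged sketch of the sliding-window inference documented above; `block_size` has no documented default, so it is passed explicitly, and the paths are placeholders:

    model.slider_predict(
        img_file=('T1.tif', 'T2.tif'),  # must be a tuple of length 2
        save_dir='output/slider',
        block_size=512,
        overlap=36)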
+ 84 - 59
paddlers/tasks/classifier.py

@@ -52,7 +52,7 @@ class BaseClassifier(BaseModel):
         super(BaseClassifier, self).__init__('classifier')
         if not hasattr(paddleclas.arch.backbone, model_name) and \
            not hasattr(cmcls, model_name):
-            raise Exception("ERROR: There's no model named {}.".format(
+            raise ValueError("ERROR: There is no model named {}.".format(
                 model_name))
         self.model_name = model_name
         self.in_channels = in_channels
@@ -202,29 +202,39 @@ class BaseClassifier(BaseModel):
               resume_checkpoint=None):
         """
         Train the model.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'CITYSCAPES'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.ClasDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.ClasDataset, optional): Evaluation dataset. 
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'IMAGENET'.
+            learning_rate (float, optional): Learning rate for training. 
+                Defaults to .1.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
+
         if self.status == 'Infer':
             logging.error(
                 "Exported inference model does not support training.",
@@ -303,28 +313,37 @@ class BaseClassifier(BaseModel):
                           quant_config=None):
         """
         Quantization-aware training.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            quant_config(dict or None, optional): Quantization configuration. If None, a default rule of thumb
-                configuration will be used. Defaults to None.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume quantization-aware training
-                from. If None, no training checkpoint will be resumed. Defaults to None.
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.ClasDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.ClasDataset, optional): Evaluation dataset. 
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            learning_rate (float, optional): Learning rate for training. 
+                Defaults to .0001.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            quant_config (dict|None, optional): Quantization configuration. If None, 
+                a default rule of thumb configuration will be used. Defaults to None.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                quantization-aware training from. If None, no training checkpoint will
+                be resumed. Defaults to None.
         """
+
         self._prepare_qat(quant_config)
         self.train(
             num_epochs=num_epochs,
@@ -346,17 +365,20 @@ class BaseClassifier(BaseModel):
     def evaluate(self, eval_dataset, batch_size=1, return_details=False):
         """
         Evaluate the model.
+
         Args:
-            eval_dataset(paddlers.dataset): Evaluation dataset.
-            batch_size(int, optional): Total batch size among all cards used for evaluation. Defaults to 1.
-            return_details(bool, optional): Whether to return evaluation details. Defaults to False.
+            eval_dataset (paddlers.datasets.ClasDataset): Evaluation dataset.
+            batch_size (int, optional): Total batch size among all cards used for 
+                evaluation. Defaults to 1.
+            return_details (bool, optional): Whether to return evaluation details. 
+                Defaults to False.
 
         Returns:
             collections.OrderedDict with key-value pairs:
                 {"top1": `acc of top1`,
                  "top5": `acc of top5`}.
-
         """
+
         self._check_transforms(eval_dataset.transforms, 'eval')
 
         self.net.eval()
@@ -404,25 +426,28 @@ class BaseClassifier(BaseModel):
     def predict(self, img_file, transforms=None):
         """
         Do inference.
+
         Args:
-            Args:
-            img_file(list[np.ndarray | str] | str | np.ndarray):
-                Image path or decoded image data, which also could constitute a list, meaning all images to be 
+            img_file (list[np.ndarray|str] | str | np.ndarray): Image path or decoded 
+                image data, which also could constitute a list, meaning all images to be 
                 predicted as a mini-batch.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for 
+                inputs. If None, the transforms for evaluation process will be used. 
+                Defaults to None.
 
         Returns:
-            If img_file is a string or np.array, the result is a dict with key-value pairs:
-            {"label map": `class_ids_map`, "scores_map": `label_names_map`}.
-            If img_file is a list, the result is a list composed of dicts with the corresponding fields:
-            class_ids_map(np.ndarray): class_ids
-            scores_map(np.ndarray): scores
-            label_names_map(np.ndarray): label_names
-
+            If `img_file` is a string or np.array, the result is a dict with key-value 
+                pairs:
+                {"class_ids_map": `class_ids`, "scores_map": `scores`, 
+                "label_names_map": `label_names`}.
+            If `img_file` is a list, the result is a list composed of dicts with the 
+                corresponding fields:
+                class_ids_map (np.ndarray): IDs of the predicted classes.
+                scores_map (np.ndarray): Scores of the predicted classes.
+                label_names_map (np.ndarray): Names of the predicted classes.
         """
+
         if transforms is None and not hasattr(self, 'test_transforms'):
-            raise Exception("transforms need to be defined, now is None.")
+            raise ValueError("transforms need to be defined, now is None.")
         if transforms is None:
             transforms = self.test_transforms
         if isinstance(img_file, (str, np.ndarray)):

+ 4 - 4
paddlers/tasks/load_model.py

@@ -52,7 +52,7 @@ def load_model(model_dir, **params):
     Load saved model from a given directory.
 
     Args:
-        model_dir(str): The directory where the model is saved.
+        model_dir(str): Directory where the model is saved.
 
     Returns:
         The model loaded from the directory.
@@ -61,8 +61,8 @@ def load_model(model_dir, **params):
     if not osp.exists(model_dir):
         logging.error("Directory '{}' does not exist!".format(model_dir))
     if not osp.exists(osp.join(model_dir, "model.yml")):
-        raise Exception("There is no file named model.yml in {}.".format(
-            model_dir))
+        raise FileNotFoundError(
+            "There is no file named model.yml in {}.".format(model_dir))
 
     with open(osp.join(model_dir, "model.yml")) as f:
         model_info = yaml.load(f.read(), Loader=yaml.Loader)
@@ -76,7 +76,7 @@ def load_model(model_dir, **params):
     model_type = model_info['_Attributes']['model_type']
     mod = getattr(paddlers.tasks, model_type)
     if not hasattr(mod, model_info['Model']):
-        raise Exception("There is no {} attribute in {}.".format(model_info[
+        raise ValueError("There is no {} attribute in {}.".format(model_info[
             'Model'], mod))
     if 'model_name' in model_info['_init_params']:
         del model_info['_init_params']['model_name']

+ 268 - 168
paddlers/tasks/object_detector.py

@@ -81,7 +81,7 @@ class BaseDetector(BaseModel):
         if len(image_shape) == 2:
             image_shape = [1, 3] + image_shape
         if image_shape[-2] % 32 > 0 or image_shape[-1] % 32 > 0:
-            raise Exception(
+            raise ValueError(
                 "Height and width in fixed_input_shape must be a multiple of 32, but received {}.".
                 format(image_shape[-2:]))
         return image_shape
@@ -206,34 +206,51 @@ class BaseDetector(BaseModel):
               resume_checkpoint=None):
         """
         Train the model.
+
         Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'IMAGENET'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .001.
-            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
-            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0..
-            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
-            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 64.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset, optional): 
+                Evaluation dataset. If None, the model will not be evaluated during training 
+                process. Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used for 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 10.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'IMAGENET'.
+            learning_rate (float, optional): Learning rate for training. Defaults to .001.
+            warmup_steps (int, optional): Number of steps of warm-up training. 
+                Defaults to 0.
+            warmup_start_lr (float, optional): Start learning rate of warm-up training. 
+                Defaults to 0..
+            lr_decay_epochs (list|tuple, optional): Epoch milestones for learning 
+                rate decay. Defaults to (216, 243).
+            lr_decay_gamma (float, optional): Gamma coefficient of learning rate decay. 
+                Defaults to .1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, determine the metric according to the dataset format. 
+                Defaults to None.
+            use_ema (bool, optional): Whether to use exponential moving average 
+                strategy. Defaults to False.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
+
         if self.status == 'Infer':
             logging.error(
                 "Exported inference model does not support training.",
@@ -242,7 +259,7 @@ class BaseDetector(BaseModel):
             logging.error(
                 "pretrain_weights and resume_checkpoint cannot be set simultaneously.",
                 exit=True)
-        if train_dataset.__class__.__name__ == 'VOCDetection':
+        if train_dataset.__class__.__name__ == 'VOCDetDataset':
             train_dataset.data_fields = {
                 'im_id', 'image_shape', 'image', 'gt_bbox', 'gt_class',
                 'difficult'
@@ -260,13 +277,13 @@ class BaseDetector(BaseModel):
                 }
 
         if metric is None:
-            if eval_dataset.__class__.__name__ == 'VOCDetection':
+            if eval_dataset.__class__.__name__ == 'VOCDetDataset':
                 self.metric = 'voc'
-            elif eval_dataset.__class__.__name__ == 'CocoDetection':
+            elif eval_dataset.__class__.__name__ == 'COCODetDataset':
                 self.metric = 'coco'
         else:
             assert metric.lower() in ['coco', 'voc'], \
-                "Evaluation metric {} is not supported, please choose form 'COCO' and 'VOC'"
+                "Evaluation metric {} is not supported. Please choose from 'COCO' and 'VOC'."
             self.metric = metric.lower()
 
         self.labels = train_dataset.labels
@@ -355,33 +372,50 @@ class BaseDetector(BaseModel):
                           quant_config=None):
         """
         Quantization-aware training.
+
         Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .001.
-            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
-            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0..
-            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
-            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            quant_config(dict or None, optional): Quantization configuration. If None, a default rule of thumb
-                configuration will be used. Defaults to None.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume quantization-aware training
-                from. If None, no training checkpoint will be resumed. Defaults to None.
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 64.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset, optional): 
+                Evaluation dataset. If None, the model will not be evaluated during training 
+                process. Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used for 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 10.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            learning_rate (float, optional): Learning rate for training. 
+                Defaults to .00001.
+            warmup_steps (int, optional): Number of steps of warm-up training. 
+                Defaults to 0.
+            warmup_start_lr (float, optional): Start learning rate of warm-up training. 
+                Defaults to 0..
+            lr_decay_epochs (list|tuple, optional): Epoch milestones for learning rate 
+                decay. Defaults to (216, 243).
+            lr_decay_gamma (float, optional): Gamma coefficient of learning rate decay. 
+                Defaults to .1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, determine the metric according to the dataset format. 
+                Defaults to None.
+            use_ema (bool, optional): Whether to use exponential moving average strategy. 
+                Defaults to False.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            quant_config (dict|None, optional): Quantization configuration. If None, 
+                a default rule of thumb configuration will be used. Defaults to None.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                quantization-aware training from. If None, no training checkpoint will
+                be resumed. Defaults to None.
         """
+
         self._prepare_qat(quant_config)
         self.train(
             num_epochs=num_epochs,
@@ -412,25 +446,32 @@ class BaseDetector(BaseModel):
                  return_details=False):
         """
         Evaluate the model.
+
         Args:
-            eval_dataset(paddlers.dataset): Evaluation dataset.
-            batch_size(int, optional): Total batch size among all cards used for evaluation. Defaults to 1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            return_details(bool, optional): Whether to return evaluation details. Defaults to False.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Evaluation dataset.
+            batch_size (int, optional): Total batch size among all cards used for 
+                evaluation. Defaults to 1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, determine the metric according to the dataset format. 
+                Defaults to None.
+            return_details (bool, optional): Whether to return evaluation details. 
+                Defaults to False.
+
         Returns:
-            collections.OrderedDict with key-value pairs: {"mAP(0.50, 11point)":`mean average precision`}.
+            collections.OrderedDict with key-value pairs: 
+                {"mAP(0.50, 11point)":`mean average precision`}.
         """
 
         if metric is None:
             if not hasattr(self, 'metric'):
-                if eval_dataset.__class__.__name__ == 'VOCDetection':
+                if eval_dataset.__class__.__name__ == 'VOCDetDataset':
                     self.metric = 'voc'
-                elif eval_dataset.__class__.__name__ == 'CocoDetection':
+                elif eval_dataset.__class__.__name__ == 'COCODetDataset':
                     self.metric = 'coco'
         else:
             assert metric.lower() in ['coco', 'voc'], \
-                "Evaluation metric {} is not supported, please choose form 'COCO' and 'VOC'"
+                "Evaluation metric {} is not supported. Please choose from 'COCO' and 'VOC'."
             self.metric = metric.lower()
 
         if self.metric == 'voc':
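A hedged evaluation sketch; the VOC metric key follows the Returns section above:

    metrics = det_model.evaluate(val_data, batch_size=1, metric='VOC')
    print(metrics['mAP(0.50, 11point)'])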
@@ -506,24 +547,32 @@ class BaseDetector(BaseModel):
     def predict(self, img_file, transforms=None):
         """
         Do inference.
+
         Args:
-            img_file(list[np.ndarray | str] | str | np.ndarray):
-                Image path or decoded image data, which also could constitute a list,meaning all images to be 
+            img_file (list[np.ndarray|str] | str | np.ndarray): Image path or decoded 
+                image data, which also could constitute a list, meaning all images to be 
                 predicted as a mini-batch.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for 
+                inputs. If None, the transforms for evaluation process will be used. 
+                Defaults to None.
+
         Returns:
-            If img_file is a string or np.array, the result is a list of dict with key-value pairs:
-            {"category_id": `category_id`, "category": `category`, "bbox": `[x, y, w, h]`, "score": `score`}.
-            If img_file is a list, the result is a list composed of dicts with the corresponding fields:
-            category_id(int): the predicted category ID. 0 represents the first category in the dataset, and so on.
-            category(str): category name
-            bbox(list): bounding box in [x, y, w, h] format
-            score(str): confidence
-            mask(dict): Only for instance segmentation task. Mask of the object in RLE format
+            If `img_file` is a string or np.array, the result is a list of dict with 
+                key-value pairs:
+                {"category_id": `category_id`, "category": `category`, "bbox": `[x, y, w, h]`, "score": `score`}.
+            If `img_file` is a list, the result is a list composed of dicts with the 
+                corresponding fields:
+                category_id (int): Predicted category ID. 0 represents the first 
+                    category in the dataset, and so on.
+                category (str): Category name.
+                bbox (list): Bounding box in [x, y, w, h] format.
+                score (str): Confidence.
+                mask (dict): Only for instance segmentation task. Mask of the object 
+                    in RLE format.
         """
+
         if transforms is None and not hasattr(self, 'test_transforms'):
-            raise Exception("transforms need to be defined, now is None.")
+            raise ValueError("transforms need to be defined, now is None.")
         if transforms is None:
             transforms = self.test_transforms
         if isinstance(img_file, (str, np.ndarray)):
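A hedged inference sketch; for a single image the result is a list of per-object dicts, per the Returns section:

    results = det_model.predict('scene.jpg')
    for obj in results:
        print(obj['category'], obj['bbox'], obj['score'])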
@@ -649,7 +698,7 @@ class PicoDet(BaseDetector):
         }:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ESNet_s', 'ESNet_m', 'ESNet_l', 'LCNet', 'MobileNetV3', 'ResNet18_vd')".
+                "{'ESNet_s', 'ESNet_m', 'ESNet_l', 'LCNet', 'MobileNetV3', 'ResNet18_vd'}.".
                 format(backbone))
         self.backbone_name = backbone
         if params.get('with_net', True):
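A hedged construction sketch using one of the supported backbones listed above; the module path is illustrative:

    import paddlers as pdrs

    picodet = pdrs.tasks.PicoDet(num_classes=20, backbone='ESNet_m')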
@@ -772,7 +821,7 @@ class PicoDet(BaseDetector):
         for i, op in enumerate(transforms.transforms):
             if isinstance(op, (BatchRandomResize, BatchRandomResizeByShort)):
                 if mode != 'train':
-                    raise Exception(
+                    raise ValueError(
                         "{} cannot be present in the {} transforms. ".format(
                             op.__class__.__name__, mode) +
                         "Please check the {} transforms.".format(mode))
@@ -851,34 +900,51 @@ class PicoDet(BaseDetector):
               resume_checkpoint=None):
         """
         Train the model.
+
         Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'IMAGENET'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .001.
-            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
-            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0..
-            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
-            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 64.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset, optional): 
+                Evaluation dataset. If None, the model will not be evaluated during training 
+                process. Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used for 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 10.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'IMAGENET'.
+            learning_rate (float, optional): Learning rate for training. Defaults to .001.
+            warmup_steps (int, optional): Number of steps of warm-up training. 
+                Defaults to 0.
+            warmup_start_lr (float, optional): Start learning rate of warm-up training. 
+                Defaults to 0..
+            lr_decay_epochs (list|tuple, optional): Epoch milestones for learning 
+                rate decay. Defaults to (216, 243).
+            lr_decay_gamma (float, optional): Gamma coefficient of learning rate decay. 
+                Defaults to .1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, determine the metric according to the dataset format. 
+                Defaults to None.
+            use_ema (bool, optional): Whether to use exponential moving average 
+                strategy. Defaults to False.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
+
         if optimizer is None:
             num_steps_each_epoch = len(train_dataset) // train_batch_size
             optimizer = self.default_optimizer(
@@ -936,8 +1002,8 @@ class YOLOv3(BaseDetector):
         }:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('MobileNetV1', 'MobileNetV1_ssld', 'MobileNetV3', 'MobileNetV3_ssld', 'DarkNet53', "
-                "'ResNet50_vd_dcn', 'ResNet34')".format(backbone))
+                "{'MobileNetV1', 'MobileNetV1_ssld', 'MobileNetV3', 'MobileNetV3_ssld', 'DarkNet53', "
+                "'ResNet50_vd_dcn', 'ResNet34'}.".format(backbone))
 
         self.backbone_name = backbone
         if params.get('with_net', True):
@@ -1030,7 +1096,7 @@ class YOLOv3(BaseDetector):
         for i, op in enumerate(transforms.transforms):
             if isinstance(op, (BatchRandomResize, BatchRandomResizeByShort)):
                 if mode != 'train':
-                    raise Exception(
+                    raise ValueError(
                         "{} cannot be present in the {} transforms. ".format(
                             op.__class__.__name__, mode) +
                         "Please check the {} transforms.".format(mode))
@@ -1089,8 +1155,8 @@ class FasterRCNN(BaseDetector):
         }:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ResNet50', 'ResNet50_vd', 'ResNet50_vd_ssld', 'ResNet34', 'ResNet34_vd', "
-                "'ResNet101', 'ResNet101_vd', 'HRNet_W18')".format(backbone))
+                "{'ResNet50', 'ResNet50_vd', 'ResNet50_vd_ssld', 'ResNet34', 'ResNet34_vd', "
+                "'ResNet101', 'ResNet101_vd', 'HRNet_W18'}.".format(backbone))
         self.backbone_name = backbone
 
         if params.get('with_net', True):
@@ -1327,34 +1393,51 @@ class FasterRCNN(BaseDetector):
               resume_checkpoint=None):
         """
         Train the model.
+
         Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'IMAGENET'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .001.
-            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
-            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0..
-            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
-            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 64.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset, optional): 
+                Evaluation dataset. If None, the model will not be evaluated during training 
+                process. Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used for 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 10.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'IMAGENET'.
+            learning_rate (float, optional): Learning rate for training. Defaults to .001.
+            warmup_steps (int, optional): Number of steps of warm-up training. 
+                Defaults to 0.
+            warmup_start_lr (float, optional): Start learning rate of warm-up training. 
+                Defaults to 0.0.
+            lr_decay_epochs (list|tuple, optional): Epoch milestones for learning 
+                rate decay. Defaults to (216, 243).
+            lr_decay_gamma (float, optional): Gamma coefficient of learning rate decay. 
+                Defaults to .1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, the metric will be determined according to the dataset format. 
+                Defaults to None.
+            use_ema (bool, optional): Whether to use exponential moving average 
+                strategy. Defaults to False.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
+
         if train_dataset.pos_num < len(train_dataset.file_list):
             train_dataset.num_workers = 0
         super(FasterRCNN, self).train(
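
For reference, a minimal sketch of how the `train()` API documented above is typically driven. This is a hypothetical setup, not part of the diff: the paths, transform pipeline, and module entry points (`pdrs.tasks.FasterRCNN`, `pdrs.datasets.VOCDetDataset`) are assumptions based on the docstring.

    import paddlers as pdrs
    from paddlers import transforms as T

    # Hypothetical data pipeline; all paths are placeholders.
    train_transforms = T.Compose(
        [T.DecodeImg(), T.RandomHorizontalFlip(), T.Normalize()])
    train_dataset = pdrs.datasets.VOCDetDataset(
        data_dir='data', file_list='data/train_list.txt',
        label_list='data/labels.txt', transforms=train_transforms)

    model = pdrs.tasks.FasterRCNN(num_classes=len(train_dataset.labels))
    model.train(
        num_epochs=12,
        train_dataset=train_dataset,
        train_batch_size=2,
        learning_rate=0.0025,
        lr_decay_epochs=(8, 11),
        save_dir='output/faster_rcnn')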
@@ -1377,7 +1460,7 @@ class FasterRCNN(BaseDetector):
         for i, op in enumerate(transforms.transforms):
             if isinstance(op, (BatchRandomResize, BatchRandomResizeByShort)):
                 if mode != 'train':
-                    raise Exception(
+                    raise ValueError(
                         "{} cannot be present in the {} transforms. ".format(
                             op.__class__.__name__, mode) +
                         "Please check the {} transforms.".format(mode))
@@ -1456,7 +1539,7 @@ class PPYOLO(YOLOv3):
         }:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ResNet50_vd_dcn', 'ResNet18_vd', 'MobileNetV3_large', 'MobileNetV3_small')".
+                "{'ResNet50_vd_dcn', 'ResNet18_vd', 'MobileNetV3_large', 'MobileNetV3_small'}.".
                 format(backbone))
         self.backbone_name = backbone
         self.downsample_ratios = [
@@ -1769,7 +1852,7 @@ class PPYOLOv2(YOLOv3):
         if backbone not in {'ResNet50_vd_dcn', 'ResNet101_vd_dcn'}:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ResNet50_vd_dcn', 'ResNet101_vd_dcn')".format(backbone))
+                "{'ResNet50_vd_dcn', 'ResNet101_vd_dcn'}.".format(backbone))
         self.backbone_name = backbone
         self.downsample_ratios = [32, 16, 8]
 
@@ -1916,7 +1999,7 @@ class MaskRCNN(BaseDetector):
         }:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ResNet50', 'ResNet50_vd', 'ResNet50_vd_ssld', 'ResNet101', 'ResNet101_vd')".
+                "{'ResNet50', 'ResNet50_vd', 'ResNet50_vd_ssld', 'ResNet101', 'ResNet101_vd'}.".
                 format(backbone))
 
         self.backbone_name = backbone + '_fpn' if with_fpn else backbone
@@ -2152,34 +2235,51 @@ class MaskRCNN(BaseDetector):
               resume_checkpoint=None):
         """
         Train the model.
+
         Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'IMAGENET'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .001.
-            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
-            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0..
-            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
-            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
-            metric({'VOC', 'COCO', None}, optional):
-                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
-            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): 
+                Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 64.
+            eval_dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset, optional): 
+                Evaluation dataset. If None, the model will not be evaluated during training 
+                process. Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used for 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 10.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'IMAGENET'.
+            learning_rate (float, optional): Learning rate for training. Defaults to .001.
+            warmup_steps (int, optional): Number of steps of warm-up training. 
+                Defaults to 0.
+            warmup_start_lr (float, optional): Start learning rate of warm-up training. 
+                Defaults to 0.0.
+            lr_decay_epochs (list|tuple, optional): Epoch milestones for learning 
+                rate decay. Defaults to (216, 243).
+            lr_decay_gamma (float, optional): Gamma coefficient of learning rate decay. 
+                Defaults to .1.
+            metric (str|None, optional): Evaluation metric. Choices are {'VOC', 'COCO', None}. 
+                If None, the metric will be determined according to the dataset format. 
+                Defaults to None.
+            use_ema (bool, optional): Whether to use exponential moving average 
+                strategy. Defaults to False.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
+
         if train_dataset.pos_num < len(train_dataset.file_list):
             train_dataset.num_workers = 0
         super(MaskRCNN, self).train(
@@ -2202,7 +2302,7 @@ class MaskRCNN(BaseDetector):
         for i, op in enumerate(transforms.transforms):
             if isinstance(op, (BatchRandomResize, BatchRandomResizeByShort)):
                 if mode != 'train':
-                    raise Exception(
+                    raise ValueError(
                         "{} cannot be present in the {} transforms. ".format(
                             op.__class__.__name__, mode) +
                         "Please check the {} transforms.".format(mode))

+ 93 - 68
paddlers/tasks/segmenter.py

@@ -228,29 +228,38 @@ class BaseSegmenter(BaseModel):
               resume_checkpoint=None):
         """
         Train the model.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            pretrain_weights(str or None, optional):
-                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'CITYSCAPES'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
-                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
-                `pretrain_weights` can be set simultaneously. Defaults to None.
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.SegDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.SegDataset|None, optional): Evaluation dataset. 
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            pretrain_weights (str|None, optional): None or name/path of pretrained 
+                weights. If None, no pretrained weights will be loaded. 
+                Defaults to 'CITYSCAPES'.
+            learning_rate (float, optional): Learning rate for training. Defaults to .025.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. Defaults 
+                to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                training from. If None, no training checkpoint will be resumed. At most
+                one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
+                Defaults to None.
         """
+
         if self.status == 'Infer':
             logging.error(
                 "Exported inference model does not support training.",
@@ -326,28 +335,37 @@ class BaseSegmenter(BaseModel):
                           quant_config=None):
         """
         Quantization-aware training.
-        Args:
-            num_epochs(int): The number of epochs.
-            train_dataset(paddlers.dataset): Training dataset.
-            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 2.
-            eval_dataset(paddlers.dataset, optional):
-                Evaluation dataset. If None, the model will not be evaluated furing training process. Defaults to None.
-            optimizer(paddle.optimizer.Optimizer or None, optional):
-                Optimizer used in training. If None, a default optimizer is used. Defaults to None.
-            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
-            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
-            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
-            learning_rate(float, optional): Learning rate for training. Defaults to .025.
-            lr_decay_power(float, optional): Learning decay power. Defaults to .9.
-            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
-            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
-            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
-            quant_config(dict or None, optional): Quantization configuration. If None, a default rule of thumb
-                configuration will be used. Defaults to None.
-            resume_checkpoint(str or None, optional): The path of the checkpoint to resume quantization-aware training
-                from. If None, no training checkpoint will be resumed. Defaults to None.
 
+        Args:
+            num_epochs (int): Number of epochs.
+            train_dataset (paddlers.datasets.SegDataset): Training dataset.
+            train_batch_size (int, optional): Total batch size among all cards used in 
+                training. Defaults to 2.
+            eval_dataset (paddlers.datasets.SegDataset|None, optional): Evaluation dataset.
+                If None, the model will not be evaluated during training process. 
+                Defaults to None.
+            optimizer (paddle.optimizer.Optimizer|None, optional): Optimizer used in 
+                training. If None, a default optimizer will be used. Defaults to None.
+            save_interval_epochs (int, optional): Epoch interval for saving the model. 
+                Defaults to 1.
+            log_interval_steps (int, optional): Step interval for printing training 
+                information. Defaults to 2.
+            save_dir (str, optional): Directory to save the model. Defaults to 'output'.
+            learning_rate (float, optional): Learning rate for training. 
+                Defaults to .0001.
+            lr_decay_power (float, optional): Learning decay power. Defaults to .9.
+            early_stop (bool, optional): Whether to adopt early stop strategy. 
+                Defaults to False.
+            early_stop_patience (int, optional): Early stop patience. Defaults to 5.
+            use_vdl (bool, optional): Whether to use VisualDL to monitor the training 
+                process. Defaults to True.
+            quant_config (dict|None, optional): Quantization configuration. If None, 
+                a default rule of thumb configuration will be used. Defaults to None.
+            resume_checkpoint (str|None, optional): Path of the checkpoint to resume
+                quantization-aware training from. If None, no training checkpoint will
+                be resumed. Defaults to None.
         """
+
         self._prepare_qat(quant_config)
         self.train(
             num_epochs=num_epochs,
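
Quantization-aware training is normally run as a short fine-tuning pass on an already trained model. A hedged sketch, reusing `train_dataset` from the training sketch above (the `load_model` entry point and paths are assumptions):

    # Hypothetical QAT fine-tuning of a previously trained segmenter.
    model = pdrs.tasks.load_model('output/unet/best_model')
    model.quant_aware_train(
        num_epochs=5,
        train_dataset=train_dataset,
        train_batch_size=2,
        learning_rate=0.0001,
        save_dir='output/unet_quant')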
@@ -369,10 +387,13 @@ class BaseSegmenter(BaseModel):
     def evaluate(self, eval_dataset, batch_size=1, return_details=False):
         """
         Evaluate the model.
+
         Args:
-            eval_dataset(paddlers.dataset): Evaluation dataset.
-            batch_size(int, optional): Total batch size among all cards used for evaluation. Defaults to 1.
-            return_details(bool, optional): Whether to return evaluation details. Defaults to False.
+            eval_dataset (paddlers.datasets.SegDataset): Evaluation dataset.
+            batch_size (int, optional): Total batch size among all cards used for 
+                evaluation. Defaults to 1.
+            return_details (bool, optional): Whether to return evaluation details. 
+                Defaults to False.
 
         Returns:
             collections.OrderedDict with key-value pairs:
@@ -384,6 +405,7 @@ class BaseSegmenter(BaseModel):
                  "category_F1-score": `F1 score`}.
 
         """
+
         self._check_transforms(eval_dataset.transforms, 'eval')
 
         self.net.eval()
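
Evaluation usage following the Returns description above; dataset construction mirrors the training sketch, and the printed keys are those listed in the docstring:

    eval_dataset = pdrs.datasets.SegDataset(
        data_dir='data', file_list='data/val_list.txt',
        label_list='data/labels.txt', transforms=transforms)
    metrics = model.evaluate(eval_dataset, batch_size=1)
    print(metrics)  # OrderedDict with 'miou', 'category_iou', etc.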
@@ -477,24 +499,27 @@ class BaseSegmenter(BaseModel):
     def predict(self, img_file, transforms=None):
         """
         Do inference.
+
         Args:
-            Args:
-            img_file(list[np.ndarray | str] | str | np.ndarray):
-                Image path or decoded image data, which also could constitute a list,meaning all images to be 
+            img_file (list[np.ndarray|str] | str | np.ndarray): Image path or decoded 
+                image data, or a list of them, in which case all the images are to be 
                 predicted as a mini-batch.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for 
+                inputs. If None, the transforms for evaluation process will be used. 
+                Defaults to None.
 
         Returns:
-            If img_file is a string or np.array, the result is a dict with key-value pairs:
-            {"label map": `label map`, "score_map": `score map`}.
-            If img_file is a list, the result is a list composed of dicts with the corresponding fields:
-            label_map(np.ndarray): the predicted label map (HW)
-            score_map(np.ndarray): the prediction score map (HWC)
-
+            If `img_file` is a string or np.ndarray, the result is a dict with 
+                key-value pairs:
+                {"label_map": `label map`, "score_map": `score map`}.
+            If `img_file` is a list, the result is a list composed of dicts with the 
+                corresponding fields:
+                label_map (np.ndarray): the predicted label map (HW)
+                score_map (np.ndarray): the prediction score map (HWC)
         """
+
         if transforms is None and not hasattr(self, 'test_transforms'):
-            raise Exception("transforms need to be defined, now is None.")
+            raise ValueError("transforms need to be defined, now is None.")
         if transforms is None:
             transforms = self.test_transforms
         if isinstance(img_file, (str, np.ndarray)):
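
A short inference sketch matching the docstring above (the file name is a placeholder):

    # Single-image inference; result keys follow the Returns section.
    result = model.predict('demo.tif')
    label_map = result['label_map']  # (H, W) predicted labels
    score_map = result['score_map']  # (H, W, C) class scores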
@@ -528,19 +553,19 @@ class BaseSegmenter(BaseModel):
                        transforms=None):
         """
         Do inference.
+
         Args:
-            Args:
-            img_file(str):
-                Image path.
-            save_dir(str):
-                Directory that contains saved geotiff file.
-            block_size(list[int] | tuple[int] | int):
+            img_file (str): Image path.
+            save_dir (str): Directory to save the output GeoTIFF file.
+            block_size (list[int] | tuple[int] | int):
                 Size of block.
-            overlap(list[int] | tuple[int] | int, optional):
+            overlap (list[int] | tuple[int] | int, optional):
                 Overlap between two blocks. Defaults to 36.
-            transforms(paddlers.transforms.Compose or None, optional):
-                Transforms for inputs. If None, the transforms for evaluation process will be used. Defaults to None.
+            transforms (paddlers.transforms.Compose|None, optional): Transforms for 
+                inputs. If None, the transforms for evaluation process will be used. 
+                Defaults to None.
         """
+
         try:
             from osgeo import gdal
         except:
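
A sketch of tiled inference over a large GeoTIFF (paths are placeholders; `block_size`/`overlap` semantics as documented above):

    model.slider_predict(
        'scene.tif', save_dir='./output', block_size=512, overlap=36)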
@@ -790,7 +815,7 @@ class DeepLabV3P(BaseSegmenter):
         if backbone not in ['ResNet50_vd', 'ResNet101_vd']:
             raise ValueError(
                 "backbone: {} is not supported. Please choose one of "
-                "('ResNet50_vd', 'ResNet101_vd')".format(backbone))
+                "{'ResNet50_vd', 'ResNet101_vd'}.".format(backbone))
         if params.get('with_net', True):
             with DisablePrint():
                 backbone = getattr(paddleseg.models, backbone)(
@@ -834,8 +859,8 @@ class HRNet(BaseSegmenter):
                  **params):
         if width not in (18, 48):
             raise ValueError(
-                "width={} is not supported, please choose from [18, 48]".format(
-                    width))
+                "width={} is not supported, please choose from {18, 48}.".
+                format(width))
         self.backbone_name = 'HRNet_W{}'.format(width)
         if params.get('with_net', True):
             with DisablePrint():

+ 11 - 18
paddlers/tasks/utils/det_metrics/coco_utils.py

@@ -71,13 +71,13 @@ def cocoapi_eval(anns,
                  classwise=False):
     """
     Args:
-        anns: Evaluation result.
-        style (str): COCOeval style, can be `bbox` , `segm` and `proposal`.
-        coco_gt (str): Whether to load COCOAPI through anno_file,
+        anns (list): Evaluation result.
+        style (str): COCOeval style. Choices are 'bbox', 'segm' and 'proposal'.
+        coco_gt (pycocotools.coco.COCO, optional): Loaded COCO annotation object,
                  eg: coco_gt = COCO(anno_file)
-        anno_file (str): COCO annotations file.
-        max_dets (tuple): COCO evaluation maxDets.
-        classwise (bool): Whether per-category AP and draw P-R Curve or not.
+        anno_file (str, optional): COCO annotations file. Defaults to None.
+        max_dets (tuple, optional): COCO evaluation maxDets. Defaults to (100, 300, 1000).
+        classwise (bool, optional): Whether to calculate per-category statistics. Defaults to False.
     """
 
     assert coco_gt is not None or anno_file is not None
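
A hedged usage sketch of `cocoapi_eval` (the annotation path and the structure of `anns` are assumptions based on the docstring above):

    from pycocotools.coco import COCO

    # `anns` is assumed to be a list of COCO-format detection results.
    cocoapi_eval(anns, style='bbox', coco_gt=COCO('instances_val.json'))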
@@ -148,12 +148,6 @@ def cocoapi_eval(anns,
 
 
 def loadRes(coco_obj, anns):
-    """
-    Load result file and return a result api object.
-    :param   resFile (str)     : file name of result file
-    :return: res (obj)         : result api object
-    """
-
     # This function has the same functionality as pycocotools.COCO.loadRes,
     # except that the input anns is list of results rather than a json file.
     # Refer to
@@ -294,7 +288,6 @@ def analyze_individual_category(k, cocoDt, cocoGt, catId, iou_type, areas=None):
         int:
         dict: Contains the keys 'ps_supercategory' and 'ps_allcategory'. The value of
             'ps_supercategory' is the precision when confusion between subcategories
             is ignored, and the value of 'ps_allcategory' is the precision when
             confusion between all categories is ignored.
-
     """
 
     # matplotlib.use() must be called *before* pylab, matplotlib.pyplot,
@@ -402,13 +395,13 @@ def coco_error_analysis(eval_details_file=None,
                 pred_mask = eval_details['mask']
             gt = eval_details['gt']
     if gt is None or pred_bbox is None:
-        raise Exception(
-            "gt/pred_bbox/pred_mask is None now, please set right eval_details_file or gt/pred_bbox/pred_mask."
+        raise ValueError(
+            "gt/pred_bbox/pred_mask is None now. Please set right eval_details_file or gt/pred_bbox/pred_mask."
         )
     if pred_bbox is not None and len(pred_bbox) == 0:
-        raise Exception("There is no predicted bbox.")
+        raise ValueError("There is no predicted bbox.")
     if pred_mask is not None and len(pred_mask) == 0:
-        raise Exception("There is no predicted mask.")
+        raise ValueError("There is no predicted mask.")
 
     def _analyze_results(cocoGt, cocoDt, res_type, out_dir):
         """
@@ -474,4 +467,4 @@ def coco_error_analysis(eval_details_file=None,
     if pred_mask is not None:
         coco_dt = loadRes(coco_gt, pred_mask)
         _analyze_results(coco_gt, coco_dt, res_type='segm', out_dir=save_dir)
-    logging.info("The analysis figures are saved in {}".format(save_dir))
+    logging.info("The analysis figures are saved in {}.".format(save_dir))

+ 23 - 20
paddlers/tasks/utils/visualize.py

@@ -50,11 +50,12 @@ def visualize_segmentation(image, result, weight=0.6, save_dir='./',
     Convert segment result to color image, and save added image.
 
     Args:
-        image: the path of origin image
-        result: the predict result of image
-        weight: the image weight of visual image, and the result weight is (1 - weight)
-        save_dir: the directory for saving visual image
-        color: the list of a BGR-mode color for each label.
+        image (str): Path of original image.
+        result (dict): Predicted results.
+        weight (float, optional): Weight used to mix the original image with the predicted image.
+            Defaults to 0.6.
+        save_dir (str, optional): Directory for saving visualized image. Defaults to './'.
+        color (list|None, optional): None or a list of BGR values for each label. Defaults to None.
     """
 
     label_map = result['label_map'].astype("uint8")
@@ -106,14 +107,15 @@ def visualize_segmentation(image, result, weight=0.6, save_dir='./',
 
 
 def get_color_map_list(num_classes):
-    """ 
-    Returns the color map for visualizing the segmentation mask, which can support arbitrary number of classes.
+    """
+    Get the color map for visualizing a segmentation mask.
+    This function supports arbitrary number of classes.
 
     Args:
-        num_classes: Number of classes
+        num_classes (int): Number of classes.
 
     Returns:
-        The color map
+        list: Color map.
     """
 
     color_map = num_classes * [0, 0, 0]
@@ -130,10 +132,10 @@ def get_color_map_list(num_classes):
     return color_map
 
 
-# expand an array of boxes by a given scale.
 def expand_boxes(boxes, scale):
     """
-        """
+    Expand an array of boxes by a given scale.
+    """
     w_half = (boxes[:, 2] - boxes[:, 0]) * .5
     h_half = (boxes[:, 3] - boxes[:, 1]) * .5
     x_c = (boxes[:, 2] + boxes[:, 0]) * .5
@@ -175,7 +177,7 @@ def draw_bbox_mask(image, results, threshold=0.5, color_map=None):
     else:
         color_map = np.asarray(color_map)
         if color_map.shape[0] != len(labels) or color_map.shape[1] != 3:
-            raise Exception(
+            raise ValueError(
                 "The shape for color_map is required to be {}x3, but recieved shape is {}x{}.".
                 format(len(labels), color_map.shape))
         if np.max(color_map) > 255 or np.min(color_map) < 0:
@@ -203,11 +205,11 @@ def draw_bbox_mask(image, results, threshold=0.5, color_map=None):
         ymax = ymin + h
 
         color = tuple(map(int, color_map[labels.index(cname)]))
-        # draw bbox
+        # Draw bbox
         image = cv2.rectangle(image, (xmin, ymin), (xmax, ymax), color,
                               linewidth)
 
-        # draw mask
+        # Draw mask
         if 'mask' in dt:
             mask = dt['mask'] * 255
             image = image.astype('float32')
@@ -230,7 +232,7 @@ def draw_bbox_mask(image, results, threshold=0.5, color_map=None):
                 thickness=1,
                 lineType=cv2.LINE_AA)
 
-        # draw label
+        # Draw label
         text_pos = (xmin, ymin)
         instance_area = w * h
         if (instance_area < _SMALL_OBJECT_AREA_THRESH or h < 40):
@@ -279,13 +281,13 @@ def draw_pr_curve(eval_details_file=None,
                 pred_mask = eval_details['mask']
             gt = eval_details['gt']
     if gt is None or pred_bbox is None:
-        raise Exception(
+        raise ValueError(
             "gt/pred_bbox/pred_mask is None now, please set right eval_details_file or gt/pred_bbox/pred_mask."
         )
     if pred_bbox is not None and len(pred_bbox) == 0:
-        raise Exception("There is no predicted bbox.")
+        raise ValueError("There is no predicted bbox.")
     if pred_mask is not None and len(pred_mask) == 0:
-        raise Exception("There is no predicted mask.")
+        raise ValueError("There is no predicted mask.")
     import matplotlib
     matplotlib.use('Agg')
     import matplotlib.pyplot as plt
@@ -297,7 +299,8 @@ def draw_pr_curve(eval_details_file=None,
 
     def _summarize(coco_gt, ap=1, iouThr=None, areaRng='all', maxDets=100):
         """
-        This function has the same functionality as _summarize() in pycocotools.COCOeval.summarize().
+        This function has the same functionality as _summarize() in 
+            pycocotools.COCOeval.summarize().
 
         Refer to
         https://github.com/cocodataset/cocoapi/blob/8c9bcc3cf640524c4c20a9c40e89cb6a2f2fa0e9/PythonAPI/pycocotools/cocoeval.py#L427,
@@ -336,7 +339,7 @@ def draw_pr_curve(eval_details_file=None,
         stats = _summarize(coco_eval, iouThr=iou_thresh)
         catIds = coco_gt.getCatIds()
         if len(catIds) != coco_eval.eval['precision'].shape[2]:
-            raise Exception(
+            raise ValueError(
                 "The category number must be same as the third dimension of precisions."
             )
         x = np.arange(0.0, 1.01, 0.01)

+ 12 - 11
paddlers/tools/yolo_cluster.py

@@ -30,9 +30,9 @@ class BaseAnchorCluster(object):
         Base Anchor Cluster
         
         Args:
-            num_anchors (int): number of clusters
-            cache (bool): whether using cache
-            cache_path (str): cache directory path
+            num_anchors (int): Number of clusters.
+            cache (bool): Whether to use cache.
+            cache_path (str): Cache directory path.
         """
         super(BaseAnchorCluster, self).__init__()
         self.num_anchors = num_anchors
@@ -99,14 +99,15 @@ class YOLOAnchorCluster(BaseAnchorCluster):
             https://github.com/ultralytics/yolov5/blob/master/utils/autoanchor.py
 
         Args:
-            num_anchors (int): number of clusters
-            dataset (DataSet): DataSet instance, VOC or COCO
-            image_size (list or int): [h, w], being an int means image height and image width are the same.
-            cache (bool): whether using cache. Defaults to True.
-            cache_path (str or None, optional): cache directory path. If None, use `data_dir` of dataset. Defaults to None.
-            iters (int, optional): iters of kmeans algorithm. Defaults to 300.
-            gen_iters (int, optional): iters of genetic algorithm. Defaults to 1000.
-            thresh (float, optional): anchor scale threshold. Defaults to 0.25.
+            num_anchors (int): Number of clusters.
+            dataset (paddlers.datasets.COCODetDataset|paddlers.datasets.VOCDetDataset): Dataset instance.
+            image_size (list[int] | int): [h, w] or an int value that corresponds to the shape [image_size, image_size].
+            cache (bool, optional): Whether to use cache. Defaults to True.
+            cache_path (str|None, optional): Path of cache directory. If None, use `dataset.data_dir`. 
+                Defaults to None.
+            iters (int, optional): Iterations of k-means algorithm. Defaults to 300.
+            gen_iters (int, optional): Iterations of genetic algorithm. Defaults to 1000.
+            thresh (float, optional): Anchor scale threshold. Defaults to 0.25.
         """
         self.dataset = dataset
         if cache_path is None:
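
A hedged sketch of anchor clustering with the parameters documented above; `train_dataset` is a detection dataset, and invoking the cluster object via `__call__` is an assumption carried over from similar implementations:

    cluster = YOLOAnchorCluster(
        num_anchors=9, dataset=train_dataset, image_size=608)
    anchors = cluster()  # assumed entry point returning the clustered anchors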

+ 10 - 8
paddlers/transforms/__init__.py

@@ -29,14 +29,16 @@ def decode_image(im_path,
     Decode an image.
     
     Args:
-        im_path (str): Path of the image to decode.
-        to_rgb (bool, optional): If True, convert input image(s) from BGR format to RGB format. Defaults to True.
-        to_uint8 (bool, optional): If True, quantize and convert decoded image(s) to uint8 type. Defaults to True.
-        decode_bgr (bool, optional): If True, automatically interpret a non-geo image (e.g. jpeg images) as a BGR image. 
-            Defaults to True.
-        decode_sar (bool, optional): If True, automatically interpret a two-channel geo image (e.g. geotiff images) as a 
-            SAR image, set this argument to True. Defaults to True.
-
+        im_path (str): Path of the image to decode.
+        to_rgb (bool, optional): If True, convert input image(s) from BGR format to 
+            RGB format. Defaults to True.
+        to_uint8 (bool, optional): If True, quantize and convert decoded image(s) to 
+            uint8 type. Defaults to True.
+        decode_bgr (bool, optional): If True, automatically interpret a non-geo 
+            image (e.g. jpeg images) as a BGR image. Defaults to True.
+        decode_sar (bool, optional): If True, automatically interpret a two-channel 
+            geo image (e.g. geotiff images) as a SAR image. Defaults to True.
+    
     Returns:
         np.ndarray: Decoded image.
     """

+ 22 - 17
paddlers/transforms/batch_operators.py

@@ -72,17 +72,18 @@ class BatchCompose(Transform):
 
 class BatchRandomResize(Transform):
     """
-    Resize a batch of input to random sizes.
+    Resize a batch of inputs to random sizes.
 
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
     Args:
-        target_sizes (list[int] | list[list | tuple] | tuple[list | tuple]):
-            Multiple target sizes, each target size is an int or list/tuple of length 2.
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional):
-            Interpolation method of resize. Defaults to 'LINEAR'.
+        target_sizes (list[int] | list[list|tuple] | tuple[list|tuple]):
+            Multiple target sizes, each of which should be an int or list/tuple of length 2.
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
     Raises:
-        TypeError: Invalid type of target_size.
+        TypeError: Invalid type of `target_size`.
         ValueError: Invalid interpolation method.
 
     See Also:
@@ -111,23 +112,27 @@ class BatchRandomResize(Transform):
 
 
 class BatchRandomResizeByShort(Transform):
-    """Resize a batch of input to random sizes with keeping the aspect ratio.
+    """
+    Resize a batch of inputs to random sizes while keeping the aspect ratio.
 
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
     Args:
-        short_sizes (list[int] | tuple[int]): Target sizes of the shorter side of the image(s).
-        max_size (int, optional): The upper bound of longer side of the image(s).
-            If max_size is -1, no upper bound is applied. Defaults to -1.
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional):
-            Interpolation method of resize. Defaults to 'LINEAR'.
+        short_sizes (list[int] | tuple[int]): Target sizes of the shorter side of 
+            the image(s).
+        max_size (int, optional): Upper bound of longer side of the image(s).
+            If `max_size` is -1, no upper bound will be applied. Defaults to -1.
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
 
     Raises:
-        TypeError: Invalid type of target_size.
+        TypeError: Invalid type of `target_size`.
         ValueError: Invalid interpolation method.
 
     See Also:
-        RandomResizeByShort: Resize input to random sizes with keeping the aspect ratio.
+        RandomResizeByShort: Resize input to random sizes while keeping the aspect 
+            ratio.
     """
 
     def __init__(self, short_sizes, max_size=-1, interp='NEAREST'):
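
The two batch-resize operators above typically implement multi-scale training; a hypothetical configuration:

    # Randomly pick one of several target sizes for each batch.
    batch_transforms = BatchRandomResize(
        target_sizes=[320, 352, 384, 416, 448, 480, 512, 544, 576, 608],
        interp='RANDOM')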
@@ -180,7 +185,7 @@ class _BatchPad(Transform):
 class _Gt2YoloTarget(Transform):
     """
    Generate YOLOv3 targets from ground truth data. This operator is only used in
-    fine grained YOLOv3 loss mode
+        fine-grained YOLOv3 loss mode.
     """
 
     def __init__(self,

+ 80 - 74
paddlers/transforms/functions.py

@@ -58,75 +58,73 @@ def center_crop(im, crop_size=224):
 # region flip
 def img_flip(im, method=0):
     """
-    flip image in different ways, this function provides 5 method to filp
-    this function can be applied to 2D or 3D images
+    Flip an image. 
+    This function provides 5 flipping methods and can be applied to 2D or 3D numpy arrays.
 
     Args:
-        im(array): image array
-        method(int or string): choose the flip method, it must be one of [
-                                0, 1, 2, 3, 4, 'h', 'v', 'hv', 'rt2lb', 'lt2rb', 'dia', 'adia']
-        0 or 'h': flipped in horizontal direction, which is the most frequently used method
-        1 or 'v': flipped in vertical direction
-        2 or 'hv': flipped in both horizontal diction and vertical direction
-        3 or 'rt2lb' or 'dia': flipped around the diagonal,
-                                which also can be thought as changing the RightTop part with LeftBottom part,
-                                so it is called 'rt2lb' as well.
-        4 or 'lt2rb' or 'adia': flipped around the anti-diagonal
-                                    which also can be thought as changing the LeftTop part with RightBottom part,
-                                    so it is called 'lt2rb' as well.
+        im (np.ndarray): Input image.
+        method (int|str): Flipping method. Must be one of [
+                                0, 1, 2, 3, 4, 'h', 'v', 'hv', 'rt2lb', 'lt2rb', 
+                                'dia', 'adia'].
+            0 or 'h': flip the image in horizontal direction, which is the most frequently 
+                used method;
+            1 or 'v': flip the image in vertical direction;
+            2 or 'hv': flip the image in both horizontal and vertical directions;
+            3 or 'rt2lb' or 'dia': flip the image across the diagonal;
+            4 or 'lt2rb' or 'adia': flip the image across the anti-diagonal.
 
     Returns:
-        flipped image(array)
+        np.ndarray: Flipped image.
 
     Raises:
-        ValueError: Shape of image should 2d, 3d or more.
+        ValueError: Invalid shape of images.
 
     Examples:
-        --assume an image is like this:
+        Assume an image is like this:
 
         img:
         / + +
         - / *
         - * /
 
-        --we can flip it in following code:
+        We can flip it with following code:
 
-        img_h = im_flip(img, 'h')
-        img_v = im_flip(img, 'v')
-        img_vh = im_flip(img, 2)
-        img_rt2lb = im_flip(img, 3)
-        img_lt2rb = im_flip(img, 4)
+        img_h = img_flip(img, 'h')
+        img_v = img_flip(img, 'v')
+        img_vh = img_flip(img, 2)
+        img_rt2lb = img_flip(img, 3)
+        img_lt2rb = img_flip(img, 4)
 
-        --we can get flipped image:
+        Then we get the flipped images:
 
-        img_h, flipped in horizontal direction
+        img_h, flipped in horizontal direction:
         + + \
         * \ -
         \ * -
 
-        img_v, flipped in vertical direction
+        img_v, flipped in vertical direction:
         - * \
         - \ *
         \ + +
 
-        img_vh, flipped in both horizontal diction and vertical direction
+        img_vh, flipped in both horizontal and vertical directions:
         / * -
         * / -
         + + /
 
-        img_rt2lb, flipped around the diagonal
+        img_rt2lb, mirrored on the diagonal:
         / | |
         + / *
         + * /
 
-        img_lt2rb, flipped around the anti-diagonal
+        img_lt2rb, mirrored on the anti-diagonal:
         / * +
         * / +
         | | /
-
     """
+
     if not len(im.shape) >= 2:
-        raise ValueError("Shape of image should 2d, 3d or more")
+        raise ValueError("The number of image dimensions is less than 2.")
     if method == 0 or method == 'h':
         return horizontal_flip(im)
     elif method == 1 or method == 'v':
@@ -176,61 +174,58 @@ def lt2rb_flip(im):
 # region rotation
 def img_simple_rotate(im, method=0):
     """
-    rotate image in simple ways, this function provides 3 method to rotate
-    this function can be applied to 2D or 3D images
+    Rotate an image. 
+    This function provides 3 rotating methods and can be applied to 2D or 3D numpy arrays.
 
     Args:
-        im(array): image array
-        method(int or string): choose the flip method, it must be one of [
+        im (np.ndarray): Input image.
+        method (int|str): Rotating method, which must be one of [
                                 0, 1, 2, 90, 180, 270
-                                ]
-        0 or 90 : rotated in 90 degree, clockwise
-        1 or 180: rotated in 180 degree, clockwise
-        2 or 270: rotated in 270 degree, clockwise
+                                ].
+            0 or 90 : rotate the image by 90 degrees, clockwise;
+            1 or 180: rotate the image by 180 degrees, clockwise;
+            2 or 270: rotate the image by 270 degrees, clockwise.
 
     Returns:
-        flipped image(array)
-
+        np.ndarray: Rotated image.
 
     Raises:
-        ValueError: Shape of image should 2d, 3d or more.
-
+        ValueError: Invalid shape of images.
 
     Examples:
-        --assume an image is like this:
+        Assume an image is like this:
 
         img:
         / + +
         - / *
         - * /
 
-        --we can rotate it in following code:
+        We can rotate it with following code:
 
         img_r90 = img_simple_rotate(img, 90)
         img_r180 = img_simple_rotate(img, 1)
         img_r270 = img_simple_rotate(img, 2)
 
-        --we can get rotated image:
+        Then we get the following rotated images:
 
-        img_r90, rotated in 90 degree
+        img_r90, rotated by 90°:
         | | \
         * \ +
         \ * +
 
-        img_r180, rotated in 180 degree
+        img_r180, rotated by 180°:
         / * -
         * / -
         + + /
 
-        img_r270, rotated in 270 degree
+        img_r270, rotated by 270°:
         + * \
         + \ *
         \ | |
-
-
     """
+
     if not len(im.shape) >= 2:
-        raise ValueError("Shape of image should 2d, 3d or more")
+        raise ValueError("The number of image dimensions is less than 2.")
     if method == 0 or method == 90:
         return rot_90(im)
     elif method == 1 or method == 180:
@@ -396,14 +391,15 @@ def resize_rle(rle, im_h, im_w, im_scale_x, im_scale_y, interp):
 
 
 def to_uint8(im, is_linear=False):
-    """ Convert raster to uint8.
+    """
+    Convert raster data to uint8 type.
     
     Args:
-        im (np.ndarray): The image.
+        im (np.ndarray): Input raster image.
        is_linear (bool, optional): Whether to use 2% linear stretching. Defaults to False.
 
     Returns:
-        np.ndarray: Image on uint8.
+        np.ndarray: Image data of uint8 type.
     """
 
     # 2% linear stretch
@@ -448,16 +444,18 @@ def to_uint8(im, is_linear=False):
 
 
 def to_intensity(im):
-    """ calculate SAR data's intensity diagram.
+    """
+    Calculate the intensity of SAR data.
 
     Args:
-        im (np.ndarray): The SAR image.
+        im (np.ndarray): SAR image.
 
     Returns:
-        np.ndarray: Intensity diagram.
+        np.ndarray: Intensity image.
     """
+
     if len(im.shape) != 2:
-        raise ValueError("im's shape must be 2.")
+        raise ValueError("`len(im.shape) must be 2.")
    # A complex dtype indicates SAR data
    if isinstance(im[0, 0], complex):
         im = abs(im)
@@ -465,15 +463,18 @@ def to_intensity(im):
 
 
 def select_bands(im, band_list=[1, 2, 3]):
-    """ Select bands.
+    """
+    Select bands of a multi-band image.
 
     Args:
-        im (np.ndarray): The image.
-        band_list (list, optional): Bands of selected (Start with 1). Defaults to [1, 2, 3].
+        im (np.ndarray): Input image.
+        band_list (list, optional): Bands to select (band indices start from 1). 
+            Defaults to [1, 2, 3].
 
     Returns:
-        np.ndarray: The image after band selected.
+        np.ndarray: Image with selected bands.
     """
+
    if len(im.shape) == 2:  # the image has only one channel
         return im
     if not isinstance(band_list, list) or len(band_list) == 0:
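
For example, selecting an RGB composite from a multispectral raster (the band order is an assumption about the sensor):

    rgb = select_bands(im, [3, 2, 1])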
@@ -492,14 +493,14 @@ def select_bands(im, band_list=[1, 2, 3]):
 
 def dehaze(im, gamma=False):
     """
-    Single image haze removal using dark channel prior.
+    Perform single image haze removal using dark channel prior.
 
     Args:
         im (np.ndarray): Input image.
         gamma (bool, optional): Use gamma correction or not. Defaults to False.
 
     Returns:
-        np.ndarray: The image after dehazed.
+        np.ndarray: Output dehazed image.
     """
 
     def _guided_filter(I, p, r, eps):
@@ -549,7 +550,8 @@ def match_histograms(im, ref):
 
     Args:
         im (np.ndarray): Input image.
-        ref (np.ndarray): Reference image to match histogram of. `ref` must have the same number of channels as `im`.
+        ref (np.ndarray): Reference image to match histogram of. `ref` must have 
+            the same number of channels as `im`.
 
     Returns:
         np.ndarray: Transformed input image.
@@ -557,6 +559,7 @@ def match_histograms(im, ref):
     Raises:
        ValueError: When the number of channels of `ref` differs from that of `im`.
     """
+
     # TODO: Check the data types of the inputs to see if they are supported by skimage
     return exposure.match_histograms(
         im, ref, channel_axis=-1 if im.ndim > 2 else None)
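
For example, radiometrically aligning one acquisition to a reference scene with the same number of channels:

    aligned = match_histograms(im, ref)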
@@ -568,10 +571,12 @@ def match_by_regression(im, ref, pif_loc=None):
 
     Args:
         im (np.ndarray): Input image.
-        ref (np.ndarray): Reference image to match. `ref` must have the same shape as `im`.
-        pif_loc (tuple|None, optional): Spatial locations where pseudo-invariant features (PIFs) are obtained. If 
-            `pif_loc` is set to None, all pixels in the image will be used as training samples for the regression model. 
-            In other cases, `pif_loc` should be a tuple of np.ndarrays. Default: None.
+        ref (np.ndarray): Reference image to match. `ref` must have the same shape 
+            as `im`.
+        pif_loc (tuple|None, optional): Spatial locations where pseudo-invariant 
+            features (PIFs) are obtained. If `pif_loc` is set to None, all pixels in 
+            the image will be used as training samples for the regression model. In 
+            other cases, `pif_loc` should be a tuple of np.ndarrays. Default: None.
 
     Returns:
         np.ndarray: Transformed input image.
@@ -609,15 +614,16 @@ def match_by_regression(im, ref, pif_loc=None):
 
 def inv_pca(im, joblib_path):
     """
-    Restore PCA result.
+    Perform inverse PCA transformation.
 
     Args:
-        im (np.ndarray): The input image after PCA.
-        joblib_path (str): Path of *.joblib about PCA.
+        im (np.ndarray): Input image after performing PCA.
+        joblib_path (str): Path of *.joblib file that stores PCA information.
 
     Returns:
-        np.ndarray: The raw input image.
+        np.ndarray: Reconstructed input image.
     """
+
     pca = load(joblib_path)
     H, W, C = im.shape
     n_im = np.reshape(im, (-1, C))

+ 155 - 112
paddlers/transforms/operators.py

@@ -123,7 +123,7 @@ class Compose(object):
 
 class Transform(object):
     """
-    Parent class of all data augmentation operations
+    Parent class of all data augmentation operators.
     """
 
     def __init__(self):
@@ -171,12 +171,15 @@ class DecodeImg(Transform):
     Decode image(s) in input.
     
     Args:
-        to_rgb (bool, optional): If True, convert input image(s) from BGR format to RGB format. Defaults to True.
-        to_uint8 (bool, optional): If True, quantize and convert decoded image(s) to uint8 type. Defaults to True.
-        decode_bgr (bool, optional): If True, automatically interpret a non-geo image (e.g., jpeg images) as a BGR image. 
-            Defaults to True.
-        decode_sar (bool, optional): If True, automatically interpret a two-channel geo image (e.g. geotiff images) as a 
-            SAR image, set this argument to True. Defaults to True.
+        to_rgb (bool, optional): If True, convert input image(s) from BGR format to 
+            RGB format. Defaults to True.
+        to_uint8 (bool, optional): If True, quantize and convert decoded image(s) to 
+            uint8 type. Defaults to True.
+        decode_bgr (bool, optional): If True, automatically interpret a non-geo image 
+            (e.g., jpeg images) as a BGR image. Defaults to True.
+        decode_sar (bool, optional): If True, automatically interpret a two-channel 
+            geo image (e.g. geotiff images) as a SAR image. Defaults to True.
     """
 
     def __init__(self,
@@ -262,7 +265,7 @@ class DecodeImg(Transform):
             sample (dict): Input sample.
 
         Returns:
-            dict: Decoded sample.
+            dict: Sample with decoded images.
         """
 
         if 'image' in sample:
@@ -299,17 +302,20 @@ class Resize(Transform):
     """
     Resize input.
 
-    - If target_size is an int, resize the image(s) to (target_size, target_size).
-    - If target_size is a list or tuple, resize the image(s) to target_size.
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    - If `target_size` is an int, resize the image(s) to (`target_size`, `target_size`).
+    - If `target_size` is a list or tuple, resize the image(s) to `target_size`.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
     Args:
-        target_size (int, list[int] | tuple[int]): Target size. If int, the height and width share the same target_size.
-            Otherwise, target_size represents [target height, target width].
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional):
-            Interpolation method of resize. Defaults to 'LINEAR'.
-        keep_ratio (bool): the resize scale of width/height is same and width/height after resized is not greater
-            than target width/height. Defaults to False.
+        target_size (int | list[int] | tuple[int]): Target size. If it is an integer, the
+            target height and width will both be set to `target_size`. Otherwise, 
+            `target_size` represents [target height, target width].
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
+        keep_ratio (bool, optional): If True, the scaling factors of width and height 
+            will be set to the same value, and the height/width of the resized image 
+            will be no greater than the target height/width. Defaults to False.
 
     Raises:
         TypeError: Invalid type of target_size.
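
Editor's note: a quick usage sketch of the documented arguments (hypothetical values; `DecodeImg` and `Compose` are the operators shown elsewhere in this diff):

    from paddlers import transforms as T

    transforms = T.Compose([
        T.DecodeImg(),
        # Resize to 512 x 512; passing interp='RANDOM' instead would pick an
        # interpolation method at random for each sample.
        T.Resize(target_size=512, interp='LINEAR', keep_ratio=False),
    ])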
@@ -420,20 +426,18 @@ class RandomResize(Transform):
     """
     Resize input to random sizes.
 
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
     Args:
-        target_sizes (list[int] | list[list | tuple] | tuple[list | tuple]):
-            Multiple target sizes, each target size is an int or list/tuple.
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional):
-            Interpolation method of resize. Defaults to 'LINEAR'.
+        target_sizes (list[int] | list[list|tuple] | tuple[list|tuple]):
+            Multiple target sizes, each of which should be int, list, or tuple.
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
 
     Raises:
-        TypeError: Invalid type of target_size.
+        TypeError: Invalid type of `target_sizes`.
         ValueError: Invalid interpolation method.
-
-    See Also:
-        Resize input to a specific size.
     """
 
     def __init__(self, target_sizes, interp='LINEAR'):
@@ -459,14 +463,17 @@ class RandomResize(Transform):
 
 class ResizeByShort(Transform):
     """
-    Resize input with keeping the aspect ratio.
+    Resize input while keeping the aspect ratio.
 
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
     Args:
         short_size (int): Target size of the shorter side of the image(s).
-        max_size (int, optional): The upper bound of longer side of the image(s). If max_size is -1, no upper bound is applied. Defaults to -1.
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional): Interpolation method of resize. Defaults to 'LINEAR'.
+        max_size (int, optional): Upper bound of longer side of the image(s). If
+            `max_size` is -1, no upper bound will be applied. Defaults to -1.
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
 
     Raises:
         ValueError: Invalid interpolation method.
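
Editor's note: the short-side arithmetic described by `short_size` and `max_size` can be mirrored as follows (a sketch of the documented behavior, not the operator's code):

    def short_side_scale(h, w, short_size, max_size=-1):
        scale = short_size / min(h, w)                    # shorter side -> short_size
        if max_size > 0:
            scale = min(scale, max_size / max(h, w))      # cap the longer side
        return round(h * scale), round(w * scale)

    short_side_scale(1080, 1920, 800, max_size=1333)  # -> (750, 1333)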
@@ -498,21 +505,24 @@ class ResizeByShort(Transform):
 
 class RandomResizeByShort(Transform):
     """
-    Resize input to random sizes with keeping the aspect ratio.
+    Resize input to random sizes while keeping the aspect ratio.
 
-    Attention: If interp is 'RANDOM', the interpolation method will be chose randomly.
+    Attention: If `interp` is 'RANDOM', the interpolation method will be chosen randomly.
 
     Args:
         short_sizes (list[int]): Target size of the shorter side of the image(s).
-        max_size (int, optional): The upper bound of longer side of the image(s). If max_size is -1, no upper bound is applied. Defaults to -1.
-        interp ({'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}, optional): Interpolation method of resize. Defaults to 'LINEAR'.
+        max_size (int, optional): Upper bound of longer side of the image(s). 
+            If `max_size` is -1, no upper bound will be applied. Defaults to -1.
+        interp (str, optional): Interpolation method for resizing image(s). One of 
+            {'NEAREST', 'LINEAR', 'CUBIC', 'AREA', 'LANCZOS4', 'RANDOM'}. 
+            Defaults to 'LINEAR'.
 
     Raises:
-        TypeError: Invalid type of target_size.
+        TypeError: Invalid type of `short_sizes`.
         ValueError: Invalid interpolation method.
 
     See Also:
-        ResizeByShort: Resize image(s) in input with keeping the aspect ratio.
+        ResizeByShort: Resize image(s) in input while keeping the aspect ratio.
     """
 
     def __init__(self, short_sizes, max_size=-1, interp='LINEAR'):
@@ -555,29 +565,30 @@ class ResizeByLong(Transform):
 
 class RandomFlipOrRotate(Transform):
     """
-    Flip or Rotate an image in different ways with a certain probability.
+    Flip or rotate an image in different directions with a certain probability.
 
     Args:
-        probs (list of float): Probabilities of flipping and rotation. Default: [0.35,0.25].
-        probsf (list of float): Probabilities of 5 flipping mode
-                                (horizontal, vertical, both horizontal diction and vertical, diagonal, anti-diagonal).
-                                Default: [0.3, 0.3, 0.2, 0.1, 0.1].
-        probsr (list of float): Probabilities of 3 rotation mode(90°, 180°, 270° clockwise). Default: [0.25,0.5,0.25].
+        probs (list[float]): Probabilities of performing flipping and rotation. 
+            Default: [0.35, 0.25].
+        probsf (list[float]): Probabilities of 5 flipping modes (horizontal, 
+            vertical, both horizontal and vertical, diagonal, anti-diagonal). 
+            Default: [0.3, 0.3, 0.2, 0.1, 0.1].
+        probsr (list[float]): Probabilities of 3 rotation modes (90°, 180°, 270° 
+            clockwise). Default: [0.25, 0.5, 0.25].
 
     Examples:
 
         from paddlers import transforms as T
 
-        # 定义数据增强
+        # Define operators for data augmentation
         train_transforms = T.Compose([
             T.DecodeImg(),
             T.RandomFlipOrRotate(
-                probs  = [0.3, 0.2]             # 进行flip增强的概率是0.3,进行rotate增强的概率是0.2,不变的概率是0.5
-                probsf = [0.3, 0.25, 0, 0, 0]   # flip增强时,使用水平flip、垂直flip的概率分别是0.3、0.25,水平且垂直flip、对角线flip、反对角线flip概率均为0,不变的概率是0.45
-                probsr = [0, 0.65, 0]),         # rotate增强时,顺时针旋转90度的概率是0,顺时针旋转180度的概率是0.65,顺时针旋转90度的概率是0,不变的概率是0.35
-            T.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
+                probs  = [0.3, 0.2],            # p=0.3 to flip, p=0.2 to rotate, p=0.5 to keep the image unchanged.
+                probsf = [0.3, 0.25, 0, 0, 0],  # p=0.3 and p=0.25 to flip horizontally and vertically; probability of no flipping is 0.45.
+                probsr = [0, 0.65, 0]),         # p=0.65 to rotate the image by 180°; probability of no rotation is 0.35.
+            T.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
         ])
-
     """
 
     def __init__(self,
@@ -615,15 +626,16 @@ class RandomFlipOrRotate(Transform):
         )
 
     def get_probs_range(self, probs):
-        '''
-        Change various probabilities into cumulative probabilities
+        """
+        Change a list of probabilities into cumulative probability intervals.
 
         Args:
-            probs(list of float): probabilities of different mode, shape:[n]
+            probs (list[float]): Probabilities of different modes, shape: [n].
 
         Returns:
-            probability intervals(list of binary list): shape:[n, 2]
-        '''
+            list[list]: Probability intervals, shape: [n, 2].
+        """
+
         ps = []
         last_prob = 0
         for prob in probs:
@@ -635,17 +647,17 @@ class RandomFlipOrRotate(Transform):
         return ps
 
     def judge_probs_range(self, p, probs):
-        '''
-        Judge whether a probability value falls within the given probability interval
+        """
+        Find which of the given probability intervals the value of `p` falls into.
 
         Args:
-            p(float): probability
-            probs(list of binary list): probability intervals, shape:[n, 2]
+            p (float): Value between 0 and 1.
+            probs (list[list]): Probability intervals, shape: [n, 2].
 
         Returns:
-            mode id(int):the probability interval number where the input probability falls,
-                         if return -1, the image will remain as it is and will not be processed
-        '''
+            int: Interval index that `p` falls into; -1 means the input is kept unchanged.
+        """
+
         for id, id_range in enumerate(probs):
             if p > id_range[0] and p < id_range[1]:
                 return id
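
Editor's note: together, the two helpers implement sampling from cumulative probability intervals. A minimal standalone sketch of the mechanism (not the class's exact code):

    import random

    def to_intervals(probs):
        ps, last = [], 0.0
        for p in probs:
            ps.append([last, last + p])
            last += p
        return ps

    intervals = to_intervals([0.3, 0.2])   # -> [[0.0, 0.3], [0.3, 0.5]]
    p = random.random()
    mode = next((i for i, (lo, hi) in enumerate(intervals) if lo < p < hi), -1)
    # mode 0: flip, mode 1: rotate, mode -1: keep the input unchanged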
@@ -702,7 +714,7 @@ class RandomHorizontalFlip(Transform):
     Randomly flip the input horizontally.
 
     Args:
-        prob(float, optional): Probability of flipping the input. Defaults to .5.
+        prob (float, optional): Probability of flipping the input. Defaults to .5.
     """
 
     def __init__(self, prob=0.5):
@@ -760,7 +772,7 @@ class RandomVerticalFlip(Transform):
     Randomly flip the input vertically.
 
     Args:
-        prob(float, optional): Probability of flipping the input. Defaults to .5.
+        prob (float, optional): Probability of flipping the input. Defaults to .5.
     """
 
     def __init__(self, prob=0.5):
@@ -821,10 +833,14 @@ class Normalize(Transform):
     3. im = im / std
 
     Args:
-        mean(list[float] | tuple[float], optional): Mean of input image(s). Defaults to [0.485, 0.456, 0.406].
-        std(list[float] | tuple[float], optional): Standard deviation of input image(s). Defaults to [0.229, 0.224, 0.225].
-        min_val(list[float] | tuple[float], optional): Minimum value of input image(s). Defaults to [0, 0, 0, ].
-        max_val(list[float] | tuple[float], optional): Max value of input image(s). Defaults to [255., 255., 255.].
+        mean (list[float] | tuple[float], optional): Mean of input image(s). 
+            Defaults to [0.485, 0.456, 0.406].
+        std (list[float] | tuple[float], optional): Standard deviation of input 
+            image(s). Defaults to [0.229, 0.224, 0.225].
+        min_val (list[float] | tuple[float], optional): Minimum value of input 
+            image(s). Defaults to [0, 0, 0].
+        max_val (list[float] | tuple[float], optional): Maximum value of input 
+            image(s). Defaults to [255., 255., 255.].
     """
 
     def __init__(self,
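
Editor's note: assuming steps 1-3 are min-max scaling followed by channel-wise standardization (step 3 is visible above; steps 1-2 are inferred), the arithmetic is:

    import numpy as np

    def normalize_sketch(im, mean, std, min_val, max_val):
        im = im.astype('float32')
        # Rescale raw values to [0, 1] ...
        im = (im - np.asarray(min_val)) / (np.asarray(max_val) - np.asarray(min_val))
        # ... then standardize each channel.
        return (im - np.asarray(mean)) / np.asarray(std)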
@@ -872,12 +888,13 @@ class Normalize(Transform):
 
 class CenterCrop(Transform):
     """
-    Crop the input at the center.
+    Crop the input image(s) at the center.
     1. Locate the center of the image.
-    2. Crop the sample.
+    2. Crop the image.
 
     Args:
-        crop_size(int, optional): target size of the cropped image(s). Defaults to 224.
+        crop_size (int, optional): Target size of the cropped image(s). 
+            Defaults to 224.
     """
 
     def __init__(self, crop_size=224):
@@ -908,22 +925,27 @@ class CenterCrop(Transform):
 class RandomCrop(Transform):
     """
     Randomly crop the input.
-    1. Compute the height and width of cropped area according to aspect_ratio and scaling.
+    1. Compute the height and width of the cropped area according to `aspect_ratio` and 
+        `scaling`.
     2. Locate the upper left corner of cropped area randomly.
     3. Crop the image(s).
-    4. Resize the cropped area to crop_size by crop_size.
+    4. Resize the cropped area to `crop_size` x `crop_size`.
 
     Args:
-        crop_size(int, list[int] | tuple[int]): Target size of the cropped area. If None, the cropped area will not be
-            resized. Defaults to None.
-        aspect_ratio (list[float], optional): Aspect ratio of cropped region in [min, max] format. Defaults to [.5, 2.].
-        thresholds (list[float], optional): Iou thresholds to decide a valid bbox crop.
-            Defaults to [.0, .1, .3, .5, .7, .9].
-        scaling (list[float], optional): Ratio between the cropped region and the original image in [min, max] format.
-            Defaults to [.3, 1.].
-        num_attempts (int, optional): The number of tries before giving up. Defaults to 50.
-        allow_no_crop (bool, optional): Whether returning without doing crop is allowed. Defaults to True.
-        cover_all_box (bool, optional): Whether to ensure all bboxes are covered in the final crop. Defaults to False.
+        crop_size (int | list[int] | tuple[int] | None): Target size of the cropped 
+            area. If None, the cropped area will not be resized. Defaults to None.
+        aspect_ratio (list[float], optional): Aspect ratio of cropped region in 
+            [min, max] format. Defaults to [.5, 2.].
+        thresholds (list[float], optional): Iou thresholds to decide a valid bbox 
+            crop. Defaults to [.0, .1, .3, .5, .7, .9].
+        scaling (list[float], optional): Ratio between the cropped region and the 
+            original image in [min, max] format. Defaults to [.3, 1.].
+        num_attempts (int, optional): Max number of tries before giving up. 
+            Defaults to 50.
+        allow_no_crop (bool, optional): Whether returning without doing crop is 
+            allowed. Defaults to True.
+        cover_all_box (bool, optional): Whether to ensure that all bboxes are 
+            covered in the final crop. Defaults to False.
     """
 
     def __init__(self,
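
Editor's note: one plausible way to sample the crop window from `scaling` and `aspect_ratio` (step 1 above). An illustrative sketch only, with clamping added so the window never exceeds the image:

    import numpy as np

    def sample_crop_window(h, w, scaling=(0.3, 1.0), aspect_ratio=(0.5, 2.0)):
        scale = np.random.uniform(*scaling)
        ratio = np.random.uniform(*aspect_ratio)
        crop_h = min(h, int(h * scale / np.sqrt(ratio)))
        crop_w = min(w, int(w * scale * np.sqrt(ratio)))
        y0 = np.random.randint(0, h - crop_h + 1)   # step 2: random upper-left corner
        x0 = np.random.randint(0, w - crop_w + 1)
        return y0, x0, crop_h, crop_w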
@@ -1107,9 +1129,10 @@ class RandomCrop(Transform):
 class RandomScaleAspect(Transform):
     """
     Crop input image(s) and resize back to original sizes.
+
     Args: 
-        min_scale (float): Minimum ratio between the cropped region and the original image.
-            If 0, image(s) will not be cropped. Defaults to .5.
+        min_scale (float): Minimum ratio between the cropped region and the original
+            image. If 0, image(s) will not be cropped. Defaults to .5.
         aspect_ratio (float): Aspect ratio of cropped region. Defaults to .33.
     """
 
@@ -1135,10 +1158,13 @@ class RandomExpand(Transform):
     Randomly expand the input by padding according to random offsets.
 
     Args:
-        upper_ratio(float, optional): The maximum ratio to which the original image is expanded. Defaults to 4..
-        prob(float, optional): The probability of apply expanding. Defaults to .5.
-        im_padding_value(list[float] | tuple[float], optional): RGB filling value for the image. Defaults to (127.5, 127.5, 127.5).
-        label_padding_value(int, optional): Filling value for the mask. Defaults to 255.
+        upper_ratio (float, optional): Maximum ratio to which the original image 
+            is expanded. Defaults to 4..
+        prob (float, optional): Probability of applying expansion. Defaults to .5.
+        im_padding_value (list[float] | tuple[float], optional): RGB filling value 
+            for the image. Defaults to (127.5, 127.5, 127.5).
+        label_padding_value (int, optional): Filling value for the mask. 
+            Defaults to 255.
 
     See Also:
         paddlers.transforms.Pad
@@ -1187,15 +1213,20 @@ class Pad(Transform):
                  label_padding_value=255,
                  size_divisor=32):
         """
-        Pad image to a specified size or multiple of size_divisor.
+        Pad image to a specified size or a multiple of `size_divisor`.
 
         Args:
-            target_size(int, Sequence, optional): Image target size, if None, pad to multiple of size_divisor. Defaults to None.
-            pad_mode({-1, 0, 1, 2}, optional): Pad mode, currently only supports four modes [-1, 0, 1, 2]. if -1, use specified offsets
-                if 0, only pad to right and bottom. If 1, pad according to center. If 2, only pad left and top. Defaults to 0.
-            im_padding_value(Sequence[float]): RGB value of pad area. Defaults to (127.5, 127.5, 127.5).
-            label_padding_value(int, optional): Filling value for the mask. Defaults to 255.
-            size_divisor(int): Image width and height after padding is a multiple of coarsest_stride.
+            target_size (int | list[int] | tuple[int], optional): Target image size. If 
+                None, pad to a multiple of `size_divisor`. Defaults to None.
+            pad_mode (int, optional): Pad mode. Currently only four modes are supported:
+                [-1, 0, 1, 2]. If -1, use specified offsets. If 0, only pad to right and 
+                bottom. If 1, pad according to center. If 2, only pad left and top. Defaults to 0.
+            im_padding_value (list[float] | tuple[float]): RGB value of padded area. 
+                Defaults to (127.5, 127.5, 127.5).
+            label_padding_value (int, optional): Filling value for the mask. 
+                Defaults to 255.
+            size_divisor (int, optional): Image width and height after padding will 
+                be a multiple of `size_divisor`. Defaults to 32.
         """
         super(Pad, self).__init__()
         if isinstance(target_size, (list, tuple)):
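
Editor's note: the pad-to-multiple behavior is simple rounding up; for example (a sketch of the `size_divisor` case only):

    import math

    def padded_shape(h, w, size_divisor=32):
        # Round each dimension up to the nearest multiple of size_divisor.
        return (math.ceil(h / size_divisor) * size_divisor,
                math.ceil(w / size_divisor) * size_divisor)

    padded_shape(500, 375)  # -> (512, 384)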
@@ -1306,8 +1337,10 @@ class MixupImage(Transform):
         Mixup two images and their gt_bbox/gt_score.
 
         Args:
-            alpha (float, optional): Alpha parameter of beta distribution. Defaults to 1.5.
-            beta (float, optional): Beta parameter of beta distribution. Defaults to 1.5.
+            alpha (float, optional): Alpha parameter of beta distribution. 
+                Defaults to 1.5.
+            beta (float, optional): Beta parameter of beta distribution. 
+                Defaults to 1.5.
         """
         super(MixupImage, self).__init__()
         if alpha <= 0.0:
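
Editor's note: roughly, detection-style mixup blends two images on a shared canvas with a Beta-distributed weight and keeps both sets of boxes. A hedged sketch (image blending only; box and score handling omitted, and not the operator's exact code):

    import numpy as np

    def mixup_sketch(im1, im2, alpha=1.5, beta=1.5):
        lam = np.random.beta(alpha, beta)               # mixing factor in (0, 1)
        h = max(im1.shape[0], im2.shape[0])
        w = max(im1.shape[1], im2.shape[1])
        canvas = np.zeros((h, w, im1.shape[2]), dtype='float32')
        canvas[:im1.shape[0], :im1.shape[1]] += im1.astype('float32') * lam
        canvas[:im2.shape[0], :im2.shape[1]] += im2.astype('float32') * (1.0 - lam)
        return canvas, lam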
@@ -1385,18 +1418,25 @@ class RandomDistort(Transform):
     Random color distortion.
 
     Args:
-        brightness_range(float, optional): Range of brightness distortion. Defaults to .5.
-        brightness_prob(float, optional): Probability of brightness distortion. Defaults to .5.
-        contrast_range(float, optional): Range of contrast distortion. Defaults to .5.
-        contrast_prob(float, optional): Probability of contrast distortion. Defaults to .5.
-        saturation_range(float, optional): Range of saturation distortion. Defaults to .5.
-        saturation_prob(float, optional): Probability of saturation distortion. Defaults to .5.
-        hue_range(float, optional): Range of hue distortion. Defaults to .5.
-        hue_prob(float, optional): Probability of hue distortion. Defaults to .5.
-        random_apply (bool, optional): whether to apply in random (yolo) or fixed (SSD)
-            order. Defaults to True.
-        count (int, optional): the number of doing distortion. Defaults to 4.
-        shuffle_channel (bool, optional): whether to swap channels randomly. Defaults to False.
+        brightness_range (float, optional): Range of brightness distortion. 
+            Defaults to .5.
+        brightness_prob (float, optional): Probability of brightness distortion. 
+            Defaults to .5.
+        contrast_range (float, optional): Range of contrast distortion. 
+            Defaults to .5.
+        contrast_prob (float, optional): Probability of contrast distortion. 
+            Defaults to .5.
+        saturation_range (float, optional): Range of saturation distortion. 
+            Defaults to .5.
+        saturation_prob (float, optional): Probability of saturation distortion. 
+            Defaults to .5.
+        hue_range (float, optional): Range of hue distortion. Defaults to .5.
+        hue_prob (float, optional): Probability of hue distortion. Defaults to .5.
+        random_apply (bool, optional): Whether to apply the transformation in a 
+            random (YOLO) or fixed (SSD) order. Defaults to True.
+        count (int, optional): Number of distortions to apply. Defaults to 4.
+        shuffle_channel (bool, optional): Whether to swap channels randomly. 
+            Defaults to False.
     """
 
     def __init__(self,
@@ -1632,7 +1672,8 @@ class SelectBand(Transform):
     Select a set of bands of input image(s).
 
     Args: 
-        band_list (list, optional): Bands to select (the band index starts with 1). Defaults to [1, 2, 3].
+        band_list (list, optional): Bands to select (band index starts from 1). 
+            Defaults to [1, 2, 3].
     """
 
     def __init__(self, band_list=[1, 2, 3]):
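
Editor's note: band selection is plain fancy indexing with a 1-based-to-0-based shift (a sketch, assuming HWC layout):

    import numpy as np

    def select_band_sketch(im, band_list=[1, 2, 3]):
        # Band indices are 1-based; ndarray axes are 0-based.
        return im[:, :, [b - 1 for b in band_list]]

    im = np.random.rand(64, 64, 10)
    select_band_sketch(im, [4, 3, 2]).shape  # -> (64, 64, 3)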
@@ -1653,11 +1694,12 @@ class SelectBand(Transform):
 class _PadBox(Transform):
     def __init__(self, num_max_boxes=50):
         """
-        Pad zeros to bboxes if number of bboxes is less than num_max_boxes.
+        Pad zeros to bboxes if the number of bboxes is less than `num_max_boxes`.
 
         Args:
-            num_max_boxes (int, optional): the max number of bboxes. Defaults to 50.
+            num_max_boxes (int, optional): Max number of bboxes. Defaults to 50.
         """
+
         self.num_max_boxes = num_max_boxes
         super(_PadBox, self).__init__()
 
@@ -1741,7 +1783,8 @@ class RandomSwap(Transform):
     Randomly swap multi-temporal images.
 
     Args:
-        prob (float, optional): Probability of swapping the input images. Default: 0.2.
+        prob (float, optional): Probability of swapping the input images. 
+            Default: 0.2.
     """
 
     def __init__(self, prob=0.2):

+ 5 - 6
paddlers/utils/download.py

@@ -50,8 +50,7 @@ def md5check(fullname, md5sum=None):
 
 def move_and_merge_tree(src, dst):
     """
-    Move src directory to dst, if dst is already exists,
-    merge src to dst
+    Move `src` to `dst`. If `dst` already exists, merge `src` with `dst`.
     """
     if not osp.exists(dst):
         shutil.move(src, dst)
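
Editor's note: the branch shown covers the simple case; a plausible reading of the merge case (an illustrative sketch, not the verbatim body) recurses into shared subdirectories and moves everything else:

    import os
    import os.path as osp
    import shutil

    def move_and_merge_tree_sketch(src, dst):
        if not osp.exists(dst):
            shutil.move(src, dst)
            return
        for name in os.listdir(src):
            s, d = osp.join(src, name), osp.join(dst, name)
            if osp.isdir(s) and osp.isdir(d):
                move_and_merge_tree_sketch(s, d)  # merge shared subdirs
            else:
                shutil.move(s, d)                 # move files and new entries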
@@ -71,10 +70,10 @@ def move_and_merge_tree(src, dst):
 
 def download(url, path, md5sum=None):
     """
-    Download from url, save to path.
+    Download from `url` and save the result to `path`.
 
-    url (str): download url
-    path (str): download to given path
+    url (str): URL.
+    path (str): Path to save the downloaded result.
     """
     if not osp.exists(path):
         os.makedirs(path)
@@ -136,7 +135,7 @@ def download(url, path, md5sum=None):
 
 def decompress(fname):
     """
-    Decompress for zip and tar file
+    Decompress zip or tar files.
     """
     logging.info("Decompressing {}...".format(fname))
 

+ 3 - 1
paddlers/utils/env.py

@@ -22,7 +22,9 @@ import paddle
 
 
 def get_environ_info():
-    """collect environment information"""
+    """
+    Collect environment information.
+    """
 
     env_info = dict()
     # TODO is_compiled_with_cuda() has not been moved

+ 2 - 2
paddlers/utils/stats.py

@@ -19,8 +19,8 @@ import numpy as np
 
 
 class SmoothedValue(object):
-    """Track a series of values and provide access to smoothed values over a
-    window.
+    """
+    Track a series of values and provide access to smoothed values over a window.
     """
 
     def __init__(self, window_size=20):
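
Editor's note: a windowed tracker like this is usually a bounded deque; a minimal sketch consistent with the docstring (not necessarily the class's full API):

    from collections import deque

    class SmoothedValueSketch:
        def __init__(self, window_size=20):
            self.values = deque(maxlen=window_size)  # old values fall out

        def update(self, value):
            self.values.append(value)

        @property
        def avg(self):
            return sum(self.values) / len(self.values)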

+ 3 - 3
paddlers/utils/utils.py

@@ -53,9 +53,9 @@ def get_single_card_bs(batch_size):
         # Evaluation of detection task only supports single card with batch size 1
         return batch_size
     else:
-        raise Exception("Please support correct batch_size, \
+        raise ValueError("Please support correct batch_size, \
                         which can be divided by available cards({}) in {}"
-                        .format(card_num, place))
+                         .format(card_num, place))
 
 
 def dict2str(dict_input):
@@ -113,7 +113,7 @@ class EarlyStop:
         self.max = 0
         self.thresh = thresh
         if patience < 1:
-            raise Exception("Argument patience should be a positive integer.")
+            raise ValueError("Argument patience should be a positive integer.")
 
     def __call__(self, current_score):
         if self.score is None:
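
Editor's note: for reference, the usual shape of such an early-stopping helper (a sketch under the assumption that "improvement" means beating the best score by more than `thresh`; the real class may differ in details):

    class EarlyStopSketch:
        def __init__(self, patience, thresh):
            self.patience, self.thresh = patience, thresh
            self.counter, self.best = 0, None

        def __call__(self, current_score):
            # Return True when training should stop.
            if self.best is None or current_score > self.best + self.thresh:
                self.best, self.counter = current_score, 0
                return False
            self.counter += 1
            return self.counter >= self.patience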

+ 1 - 1
tests/data/data_utils.py

@@ -332,7 +332,7 @@ def build_input_from_file(file_list, prefix='', task='auto', label_list=None):
         prefix (str, optional): A nonempty `prefix` specifies the directory that stores the images and annotation files. Default: ''.
         task (str, optional): Supported values are 'seg', 'det', 'cd', 'clas', and 'auto'. When `task` is set to 'auto', automatically determine the task based on the input. 
             Default: 'auto'.
-        label_list (str | None, optional): Path of label_list. Default: None.
+        label_list (str|None, optional): Path of label_list. Default: None.
 
     Returns:
         list: List of samples.

+ 13 - 13
tests/testing_utils.py

@@ -118,7 +118,7 @@ class _CommonTestNamespace:
                 assertForFloat = self.assertTrue
 
             result_t = type(result)
-            error_msg = 'Output has diff at place:{}. \nExpect: {} \nBut Got: {} in class {}'
+            error_msg = "Output has diff at place:{}. \nExpect: {} \nBut Got: {} in class {}"
             if result_t in [list, tuple]:
                 result_t = get_container_type(result)
             if result_t in [
@@ -144,8 +144,8 @@ class _CommonTestNamespace:
                             result.shape, self.__class__.__name__))
             else:
                 raise ValueError(
-                    'result type must be str, int, bool, set, np.bool, np.int32, '
-                    'np.int64, np.str, float, np.ndarray, np.float32, np.float64'
+                    "result type must be str, int, bool, set, np.bool, np.int32, "
+                    "np.int64, np.str, float, np.ndarray, np.float32, np.float64"
                 )
 
         def check_output_equal(self,
@@ -157,13 +157,13 @@ class _CommonTestNamespace:
             Check whether result and expected result are equal, including shape. 
             
             Args:
-                result: str, int, bool, set, np.ndarray.
+                result (str|int|bool|set|np.ndarray):
                     The result needs to be checked.
-                expected_result: str, int, bool, set, np.ndarray. The type has to be same as result's.
-                    Use the expected result to check result.
-                rtol: float
+                expected_result (str|int|bool|set|np.ndarray): The type has to be the 
+                    same as `result`'s. Use the expected result to check `result`.
+                rtol (float, optional):
                     relative tolerance, default 1.e-5.
-                atol: float
+                atol (float, optional):
                     absolute tolerance, default 1.e-8
             """
 
@@ -178,13 +178,13 @@ class _CommonTestNamespace:
             Check whether result and expected result are not equal, including shape. 
 
             Args:
-                result: str, int, bool, set, np.ndarray.
+                result (str|int|bool|set|np.ndarray):
                     The result needs to be checked.
-                expected_result: str, int, bool, set, np.ndarray. The type has to be same as result's.
-                    Use the expected result to check result.
-                rtol: float
+                expected_result (str|int|bool|set|np.ndarray): The type has to be the 
+                    same as `result`'s. Use the expected result to check `result`.
+                rtol (float, optional):
                     relative tolerance, default 1.e-5.
-                atol: float
+                atol (float, optional):
                     absolute tolerance, default 1.e-8
             """
 

+ 3 - 2
tools/coco_tools/json_AnnoSta.py

@@ -11,7 +11,7 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Statistics of the annotations in a JSON file: generate a CSV of the results, plus distributions of bbox shape, bbox shape ratio, bbox start position, bbox end position, object category, and number of objects per image
 python ./coco_tools/json_AnnoSta.py \
@@ -24,7 +24,8 @@ python ./coco_tools/json_AnnoSta.py \
     --png_cat_path=./anno_sta/annos_cat.png \
     --png_objNum_path=./anno_sta/annos_objNum.png \
     --get_relative=True
-'''
+"""
+
 import os
 import json
 import argparse

+ 3 - 2
tools/coco_tools/json_Img2Json.py

@@ -11,14 +11,15 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Generate test.json from the folder of test images
 python ./coco_tools/json_Img2Json.py \
     --test_image_path=./test2017 \
     --json_train_path=./annotations/instances_val2017.json \
     --json_test_path=./test.json
-'''
+"""
+
 import os, cv2
 import json
 import argparse

+ 2 - 2
tools/coco_tools/json_ImgSta.py

@@ -11,7 +11,7 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Collect statistics on the images in a JSON file, save them to a CSV, and plot 2D distributions of image shape and image shape ratio
 python ./coco_tools/json_ImgSta.py \
@@ -19,7 +19,7 @@ python ./coco_tools/json_ImgSta.py \
     --csv_path=./img_sta/images.csv \
     --png_shape_path=./img_sta/images_shape.png \
     --png_shapeRate_path=./img_sta/images_shapeRate.png
-'''
+"""
 
 import json
 import argparse

+ 2 - 2
tools/coco_tools/json_InfoShow.py

@@ -11,13 +11,13 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Show basic information about a JSON file
 python ./coco_tools/json_InfoShow.py \
        --json_path=./annotations/instances_val2017.json \
        --show_num 5
-'''
+"""
 
 import json
 import argparse

+ 2 - 2
tools/coco_tools/json_Merge.py

@@ -11,14 +11,14 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Merge JSON files. The fields to merge can be controlled via merge_keys; the 'images' and 'annotations' fields are merged by default
 python ./coco_tools/json_Merge.py \
     --json1_path=./annotations/instances_train2017.json \
     --json2_path=./annotations/instances_val2017.json \
     --save_path=./instances_trainval2017.json
-'''
+"""
 
 import json
 import argparse

+ 2 - 2
tools/coco_tools/json_Split.py

@@ -11,14 +11,14 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-'''
+"""
 @File Description:
 # Split a JSON dataset. The split ratio or count can be controlled via val_split_rate and val_split_num; keep_val_inTrain sets whether val-related information is kept in train
 python ./coco_tools/json_Split.py \
     --json_all_path=./annotations/instances_val2017.json \
     --json_train_path=./instances_val2017_train.json \
     --json_val_path=./instances_val2017_val.json
-'''
+"""
 
 import json
 import argparse

+ 1 - 1
tools/match.py

@@ -22,7 +22,7 @@ from utils import Raster, raster2uint8, save_geotiff, time_it
 
 class MatchError(Exception):
     def __str__(self):
-        return "Cannot match two images."
+        return "Cannot match the two images."
 
 
 def _calcu_tf(im1, im2):

+ 21 - 16
tools/utils/raster.py

@@ -48,21 +48,23 @@ def _get_type(type_name: str) -> int:
 
 class Raster:
     def __init__(self,
-                 path: Optional[str],
+                 path: str,
                  gdal_obj: Optional[gdal.Dataset]=None,
                  band_list: Union[List[int], Tuple[int], None]=None,
                  to_uint8: bool=False) -> None:
         """
-        Class of raster reader.
+        Reader of raster files.
         
         Args:
-            path (Optional[str]): Path of raster file.
-            gdal_obj (Optional[Any], optional): GDAL dataset. Defaults to None.
-            band_list (Union[List[int], Tuple[int], None], optional): 
-                Select a set of bands (the band index starts from 1) or None (read all bands). Defaults to None.
-            to_uint8 (bool, optional): 
-                Whether to convert data type to uint8. Defaults to False.
+            path (str): Path of raster file.
+            gdal_obj (gdal.Dataset|None, optional): GDAL dataset. Defaults to None.
+            band_list (list[int] | tuple[int] | None, optional): Select a set of 
+                bands (the band index starts from 1). If None, read all bands. 
+                Defaults to None.
+            to_uint8 (bool, optional): Whether to convert data type to uint8. 
+                Defaults to False.
         """
+
         super(Raster, self).__init__()
         if path is not None:
             if osp.exists(path):
@@ -92,13 +94,15 @@ class Raster:
         self._getType()
 
     def setBands(self, band_list: Union[List[int], Tuple[int], None]) -> None:
-        """ 
+        """
         Set bands of data.
         
         Args:
-            band_list (Union[List[int], Tuple[int], None]): 
-                Select a set of bands (the band index starts from 1) or None (read all bands). Defaults to None.
+            band_list (list[int] | tuple[int] | None, optional): Select a set of 
+                bands (the band index starts from 1). If None, read all bands. 
+                Defaults to None.
         """
+
         if band_list is not None:
             if len(band_list) > self.bands:
                 raise ValueError(
@@ -113,18 +117,19 @@ class Raster:
                  start_loc: Union[List[int], Tuple[int, int], None]=None,
                  block_size: Union[List[int], Tuple[int, int]]=[512, 512]
                  ) -> np.ndarray:
-        """ 
+        """
         Fetch data in a ndarray.
         
         Args:
-            start_loc (Union[List[int], Tuple[int], None], optional): 
-                Coordinates of the upper left corner of the block. None value means returning full image.
-            block_size (Union[List[int], Tuple[int]], optional): 
-                Block size. Defaults to [512, 512].
+            start_loc (list[int] | tuple[int] | None, optional): Coordinates of the 
+                upper left corner of the block. If None, return the full image.
+            block_size (list[int] | tuple[int], optional): Block size. 
+                Defaults to [512, 512].
 
         Returns:
             np.ndarray: data's ndarray.
         """
+
         if self._src_data is not None:
             if start_loc is None:
                 return self._getArray()
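
Editor's note: block-wise access maps directly onto GDAL's ReadAsArray(xoff, yoff, xsize, ysize); for example (hypothetical file path):

    from osgeo import gdal

    ds = gdal.Open('example.tif')
    # Fetch one 512 x 512 block starting at the upper-left corner; iterate
    # over offsets to stream a large raster window by window.
    block = ds.ReadAsArray(0, 0, 512, 512)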

+ 2 - 2
tutorials/train/object_detection/faster_rcnn.py

@@ -54,14 +54,14 @@ eval_transforms = T.Compose([
 ])
 
 # Build the training and validation datasets, respectively
-train_dataset = pdrs.datasets.VOCDetection(
+train_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=TRAIN_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,
     transforms=train_transforms,
     shuffle=True)
 
-eval_dataset = pdrs.datasets.VOCDetection(
+eval_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=EVAL_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,

+ 2 - 2
tutorials/train/object_detection/ppyolo.py

@@ -54,14 +54,14 @@ eval_transforms = T.Compose([
 ])
 
 # Build the training and validation datasets, respectively
-train_dataset = pdrs.datasets.VOCDetection(
+train_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=TRAIN_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,
     transforms=train_transforms,
     shuffle=True)
 
-eval_dataset = pdrs.datasets.VOCDetection(
+eval_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=EVAL_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,

+ 2 - 2
tutorials/train/object_detection/ppyolotiny.py

@@ -54,14 +54,14 @@ eval_transforms = T.Compose([
 ])
 
 # Build the training and validation datasets, respectively
-train_dataset = pdrs.datasets.VOCDetection(
+train_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=TRAIN_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,
     transforms=train_transforms,
     shuffle=True)
 
-eval_dataset = pdrs.datasets.VOCDetection(
+eval_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=EVAL_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,

+ 2 - 2
tutorials/train/object_detection/ppyolov2.py

@@ -54,14 +54,14 @@ eval_transforms = T.Compose([
 ])
 
 # Build the training and validation datasets, respectively
-train_dataset = pdrs.datasets.VOCDetection(
+train_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=TRAIN_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,
     transforms=train_transforms,
     shuffle=True)
 
-eval_dataset = pdrs.datasets.VOCDetection(
+eval_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=EVAL_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,

+ 2 - 2
tutorials/train/object_detection/yolov3.py

@@ -54,14 +54,14 @@ eval_transforms = T.Compose([
 ])
 
 # Build the training and validation datasets, respectively
-train_dataset = pdrs.datasets.VOCDetection(
+train_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=TRAIN_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,
     transforms=train_transforms,
     shuffle=True)
 
-eval_dataset = pdrs.datasets.VOCDetection(
+eval_dataset = pdrs.datasets.VOCDetDataset(
     data_dir=DATA_DIR,
     file_list=EVAL_FILE_LIST_PATH,
     label_list=LABEL_LIST_PATH,