123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265 |
- # Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- import os.path as osp
- from typing import List, Tuple, Union, Optional
- import numpy as np
- try:
- from osgeo import gdal
- except:
- import gdal
- from paddlers.transforms.functions import to_uint8 as raster2uint8
- def _get_type(type_name: str) -> int:
- if type_name in ["bool", "uint8"]:
- gdal_type = gdal.GDT_Byte
- elif type_name in ["int8", "int16"]:
- gdal_type = gdal.GDT_Int16
- elif type_name == "uint16":
- gdal_type = gdal.GDT_UInt16
- elif type_name == "int32":
- gdal_type = gdal.GDT_Int32
- elif type_name == "uint32":
- gdal_type = gdal.GDT_UInt32
- elif type_name in ["int64", "uint64", "float16", "float32"]:
- gdal_type = gdal.GDT_Float32
- elif type_name == "float64":
- gdal_type = gdal.GDT_Float64
- elif type_name == "complex64":
- gdal_type = gdal.GDT_CFloat64
- else:
- raise TypeError("Non-suported data type {}.".format(type_name))
- return gdal_type
- class Raster:
- def __init__(self,
- path: str,
- gdal_obj: Optional[gdal.Dataset]=None,
- band_list: Union[List[int], Tuple[int], None]=None,
- to_uint8: bool=False) -> None:
- """
- Reader of raster files.
-
- Args:
- path (str): Path of raster file.
- gdal_obj (gdal.Dataset|None, optional): GDAL dataset. Defaults to None.
- band_list (list[int] | tuple[int] | None, optional): Select a set of
- bands (the band index starts from 1). If None, read all bands.
- Defaults to None.
- to_uint8 (bool, optional): Whether to convert data type to uint8.
- Defaults to False.
- """
- super(Raster, self).__init__()
- if path is not None:
- if osp.exists(path):
- self.path = path
- self.ext_type = path.split(".")[-1]
- if self.ext_type.lower() in ["npy", "npz"]:
- self._src_data = None
- else:
- try:
- # raster format support in GDAL:
- # https://www.osgeo.cn/gdal/drivers/raster/index.html
- self._src_data = gdal.Open(path)
- except:
- raise TypeError("Unsupported data format: {}".format(
- self.ext_type))
- else:
- raise ValueError("The path {0} does not exist.".format(path))
- else:
- if gdal_obj is not None:
- self._src_data = gdal_obj
- else:
- raise ValueError(
- "At least one of `path` and `gdal_obj` is not None.")
- self.to_uint8 = to_uint8
- self._getInfo()
- self.setBands(band_list)
- self._getType()
- def setBands(self, band_list: Union[List[int], Tuple[int], None]) -> None:
- """
- Set bands of data.
-
- Args:
- band_list (list[int] | tuple[int] | None, optional): Select a set of
- bands (the band index starts from 1). If None, read all bands.
- Defaults to None.
- """
- if band_list is not None:
- if len(band_list) > self.bands:
- raise ValueError(
- "The lenght of band_list must be less than {0}.".format(
- str(self.bands)))
- if max(band_list) > self.bands or min(band_list) < 1:
- raise ValueError("The range of band_list must within [1, {0}].".
- format(str(self.bands)))
- self.band_list = band_list
- def getArray(self,
- start_loc: Union[List[int], Tuple[int, int], None]=None,
- block_size: Union[List[int], Tuple[int, int]]=[512, 512]
- ) -> np.ndarray:
- """
- Fetch data in a ndarray.
-
- Args:
- start_loc (list[int] | tuple[int] | None, optional): Coordinates of the
- upper left corner of the block. None value means returning full image.
- block_size (list[int] | tuple[int], optional): Block size.
- Defaults to [512, 512].
- Returns:
- np.ndarray: data's ndarray.
- """
- if self._src_data is not None:
- if start_loc is None:
- return self._getArray()
- else:
- return self._getBlock(start_loc, block_size)
- else:
- print("Numpy doesn't support blocking temporarily.")
- return self._getNumpy()
- def _getInfo(self) -> None:
- if self._src_data is not None:
- self.width = self._src_data.RasterXSize
- self.height = self._src_data.RasterYSize
- self.bands = self._src_data.RasterCount
- self.geot = self._src_data.GetGeoTransform()
- self.proj = self._src_data.GetProjection()
- else:
- d_img = self._getNumpy()
- d_shape = d_img.shape
- if len(d_shape) == 3:
- self.height, self.width, self.bands = d_shape
- else:
- self.height, self.width = d_shape
- self.bands = 1
- self.geot = None
- self.proj = None
- def _getType(self) -> None:
- d_name = self.getArray([0, 0], [1, 1]).dtype.name
- self.datatype = _get_type(d_name)
- def _getNumpy(self):
- ima = np.load(self.path)
- if self.band_list is not None:
- band_array = []
- for b in self.band_list:
- band_i = ima[:, :, b - 1]
- band_array.append(band_i)
- ima = np.stack(band_array, axis=0)
- return ima
- def _getArray(self,
- window: Union[None, List[int], Tuple[int, int, int, int]]=None
- ) -> np.ndarray:
- if self._src_data is None:
- raise ValueError("The raster is None.")
- if window is not None:
- xoff, yoff, xsize, ysize = window
- if self.band_list is None:
- if window is None:
- ima = self._src_data.ReadAsArray()
- else:
- ima = self._src_data.ReadAsArray(xoff, yoff, xsize, ysize)
- else:
- band_array = []
- for b in self.band_list:
- if window is None:
- band_i = self._src_data.GetRasterBand(b).ReadAsArray()
- else:
- band_i = self._src_data.GetRasterBand(b).ReadAsArray(
- xoff, yoff, xsize, ysize)
- band_array.append(band_i)
- ima = np.stack(band_array, axis=0)
- if self.bands == 1:
- if len(ima.shape) == 3:
- ima = ima.squeeze(0)
- # the type is complex means this is a SAR data
- if isinstance(type(ima[0, 0]), complex):
- ima = abs(ima)
- else:
- ima = ima.transpose((1, 2, 0))
- if self.to_uint8 is True:
- ima = raster2uint8(ima)
- return ima
- def _getBlock(self,
- start_loc: Union[List[int], Tuple[int, int]],
- block_size: Union[List[int], Tuple[int, int]]=[512, 512]
- ) -> np.ndarray:
- if len(start_loc) != 2 or len(block_size) != 2:
- raise ValueError("The length start_loc/block_size must be 2.")
- xoff, yoff = start_loc
- xsize, ysize = block_size
- if (xoff < 0 or xoff > self.width) or (yoff < 0 or yoff > self.height):
- raise ValueError("start_loc must be within [0-{0}, 0-{1}].".format(
- str(self.width), str(self.height)))
- if xoff + xsize > self.width:
- xsize = self.width - xoff
- if yoff + ysize > self.height:
- ysize = self.height - yoff
- ima = self._getArray([int(xoff), int(yoff), int(xsize), int(ysize)])
- h, w = ima.shape[:2] if len(ima.shape) == 3 else ima.shape
- if self.bands != 1:
- tmp = np.zeros(
- (block_size[0], block_size[1], self.bands), dtype=ima.dtype)
- tmp[:h, :w, :] = ima
- else:
- tmp = np.zeros((block_size[0], block_size[1]), dtype=ima.dtype)
- tmp[:h, :w] = ima
- return tmp
- def save_geotiff(image: np.ndarray,
- save_path: str,
- proj: str,
- geotf: Tuple,
- use_type: Optional[int]=None,
- clear_ds: bool=True) -> None:
- if len(image.shape) == 2:
- height, width = image.shape
- channel = 1
- else:
- height, width, channel = image.shape
- if use_type is not None:
- data_type = use_type
- else:
- data_type = _get_type(image.dtype.name)
- driver = gdal.GetDriverByName("GTiff")
- dst_ds = driver.Create(save_path, width, height, channel, data_type)
- dst_ds.SetGeoTransform(geotf)
- dst_ds.SetProjection(proj)
- if channel > 1:
- for i in range(channel):
- band = dst_ds.GetRasterBand(i + 1)
- band.WriteArray(image[:, :, i])
- dst_ds.FlushCache()
- else:
- band = dst_ds.GetRasterBand(1)
- band.WriteArray(image)
- dst_ds.FlushCache()
- if clear_ds:
- dst_ds = None
- return dst_ds
|