python-wml 3.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of python-wml might be problematic. Click here for more details.

Files changed (164) hide show
  1. python_wml-3.0.0.dist-info/LICENSE +23 -0
  2. python_wml-3.0.0.dist-info/METADATA +51 -0
  3. python_wml-3.0.0.dist-info/RECORD +164 -0
  4. python_wml-3.0.0.dist-info/WHEEL +5 -0
  5. python_wml-3.0.0.dist-info/top_level.txt +1 -0
  6. wml/__init__.py +0 -0
  7. wml/basic_data_def/__init__.py +2 -0
  8. wml/basic_data_def/detection_data_def.py +279 -0
  9. wml/basic_data_def/io_data_def.py +2 -0
  10. wml/basic_img_utils.py +816 -0
  11. wml/img_patch.py +92 -0
  12. wml/img_utils.py +571 -0
  13. wml/iotoolkit/__init__.py +17 -0
  14. wml/iotoolkit/aic_keypoint.py +115 -0
  15. wml/iotoolkit/baidu_mask_toolkit.py +244 -0
  16. wml/iotoolkit/base_dataset.py +210 -0
  17. wml/iotoolkit/bboxes_statistics.py +515 -0
  18. wml/iotoolkit/build.py +0 -0
  19. wml/iotoolkit/cityscapes_toolkit.py +183 -0
  20. wml/iotoolkit/classification_data_statistics.py +25 -0
  21. wml/iotoolkit/coco_data_fwd.py +225 -0
  22. wml/iotoolkit/coco_keypoints.py +118 -0
  23. wml/iotoolkit/coco_keypoints_fmt2.py +103 -0
  24. wml/iotoolkit/coco_toolkit.py +397 -0
  25. wml/iotoolkit/coco_wholebody.py +269 -0
  26. wml/iotoolkit/common.py +108 -0
  27. wml/iotoolkit/crowd_pose.py +146 -0
  28. wml/iotoolkit/fast_labelme.py +110 -0
  29. wml/iotoolkit/image_folder.py +95 -0
  30. wml/iotoolkit/imgs_cache.py +58 -0
  31. wml/iotoolkit/imgs_reader_mt.py +73 -0
  32. wml/iotoolkit/labelme_base.py +102 -0
  33. wml/iotoolkit/labelme_json_to_img.py +49 -0
  34. wml/iotoolkit/labelme_toolkit.py +117 -0
  35. wml/iotoolkit/labelme_toolkit_fwd.py +733 -0
  36. wml/iotoolkit/labelmemckeypoints_dataset.py +169 -0
  37. wml/iotoolkit/lspet.py +48 -0
  38. wml/iotoolkit/mapillary_vistas_toolkit.py +269 -0
  39. wml/iotoolkit/mat_data.py +90 -0
  40. wml/iotoolkit/mckeypoints_statistics.py +28 -0
  41. wml/iotoolkit/mot_datasets.py +62 -0
  42. wml/iotoolkit/mpii.py +108 -0
  43. wml/iotoolkit/npmckeypoints_dataset.py +164 -0
  44. wml/iotoolkit/o365_to_coco.py +136 -0
  45. wml/iotoolkit/object365_toolkit.py +156 -0
  46. wml/iotoolkit/object365v2_toolkit.py +71 -0
  47. wml/iotoolkit/pascal_voc_data.py +51 -0
  48. wml/iotoolkit/pascal_voc_toolkit.py +194 -0
  49. wml/iotoolkit/pascal_voc_toolkit_fwd.py +473 -0
  50. wml/iotoolkit/penn_action.py +57 -0
  51. wml/iotoolkit/rawframe_dataset.py +129 -0
  52. wml/iotoolkit/rewrite_pascal_voc.py +28 -0
  53. wml/iotoolkit/semantic_data.py +49 -0
  54. wml/iotoolkit/split_file_by_type.py +29 -0
  55. wml/iotoolkit/sports_mot_datasets.py +78 -0
  56. wml/iotoolkit/vis_objectdetection_dataset.py +70 -0
  57. wml/iotoolkit/vis_torch_data.py +39 -0
  58. wml/iotoolkit/yolo_toolkit.py +38 -0
  59. wml/object_detection2/__init__.py +4 -0
  60. wml/object_detection2/basic_visualization.py +37 -0
  61. wml/object_detection2/bboxes.py +812 -0
  62. wml/object_detection2/data_process_toolkit.py +146 -0
  63. wml/object_detection2/keypoints.py +292 -0
  64. wml/object_detection2/mask.py +120 -0
  65. wml/object_detection2/metrics/__init__.py +3 -0
  66. wml/object_detection2/metrics/build.py +15 -0
  67. wml/object_detection2/metrics/classifier_toolkit.py +440 -0
  68. wml/object_detection2/metrics/common.py +71 -0
  69. wml/object_detection2/metrics/mckps_toolkit.py +338 -0
  70. wml/object_detection2/metrics/toolkit.py +1953 -0
  71. wml/object_detection2/npod_toolkit.py +361 -0
  72. wml/object_detection2/odtools.py +243 -0
  73. wml/object_detection2/standard_names.py +75 -0
  74. wml/object_detection2/visualization.py +956 -0
  75. wml/object_detection2/wmath.py +34 -0
  76. wml/semantic/__init__.py +0 -0
  77. wml/semantic/basic_toolkit.py +65 -0
  78. wml/semantic/mask_utils.py +156 -0
  79. wml/semantic/semantic_test.py +21 -0
  80. wml/semantic/structures.py +1 -0
  81. wml/semantic/toolkit.py +105 -0
  82. wml/semantic/visualization_utils.py +658 -0
  83. wml/threadtoolkit.py +50 -0
  84. wml/walgorithm.py +228 -0
  85. wml/wcollections.py +212 -0
  86. wml/wfilesystem.py +487 -0
  87. wml/wml_utils.py +657 -0
  88. wml/wstructures/__init__.py +4 -0
  89. wml/wstructures/common.py +9 -0
  90. wml/wstructures/keypoints_train_toolkit.py +149 -0
  91. wml/wstructures/kps_structures.py +579 -0
  92. wml/wstructures/mask_structures.py +1161 -0
  93. wml/wtorch/__init__.py +8 -0
  94. wml/wtorch/bboxes.py +104 -0
  95. wml/wtorch/classes_suppression.py +24 -0
  96. wml/wtorch/conv_module.py +181 -0
  97. wml/wtorch/conv_ws.py +144 -0
  98. wml/wtorch/data/__init__.py +16 -0
  99. wml/wtorch/data/_utils/__init__.py +45 -0
  100. wml/wtorch/data/_utils/collate.py +183 -0
  101. wml/wtorch/data/_utils/fetch.py +47 -0
  102. wml/wtorch/data/_utils/pin_memory.py +121 -0
  103. wml/wtorch/data/_utils/signal_handling.py +72 -0
  104. wml/wtorch/data/_utils/worker.py +227 -0
  105. wml/wtorch/data/base_data_loader_iter.py +93 -0
  106. wml/wtorch/data/dataloader.py +501 -0
  107. wml/wtorch/data/datapipes/__init__.py +1 -0
  108. wml/wtorch/data/datapipes/iter/__init__.py +12 -0
  109. wml/wtorch/data/datapipes/iter/batch.py +126 -0
  110. wml/wtorch/data/datapipes/iter/callable.py +92 -0
  111. wml/wtorch/data/datapipes/iter/listdirfiles.py +37 -0
  112. wml/wtorch/data/datapipes/iter/loadfilesfromdisk.py +30 -0
  113. wml/wtorch/data/datapipes/iter/readfilesfromtar.py +60 -0
  114. wml/wtorch/data/datapipes/iter/readfilesfromzip.py +63 -0
  115. wml/wtorch/data/datapipes/iter/sampler.py +94 -0
  116. wml/wtorch/data/datapipes/utils/__init__.py +0 -0
  117. wml/wtorch/data/datapipes/utils/common.py +65 -0
  118. wml/wtorch/data/dataset.py +354 -0
  119. wml/wtorch/data/datasets/__init__.py +4 -0
  120. wml/wtorch/data/datasets/common.py +53 -0
  121. wml/wtorch/data/datasets/listdirfilesdataset.py +36 -0
  122. wml/wtorch/data/datasets/loadfilesfromdiskdataset.py +30 -0
  123. wml/wtorch/data/distributed.py +135 -0
  124. wml/wtorch/data/multi_processing_data_loader_iter.py +866 -0
  125. wml/wtorch/data/sampler.py +267 -0
  126. wml/wtorch/data/single_process_data_loader_iter.py +24 -0
  127. wml/wtorch/data/test_data_loader.py +26 -0
  128. wml/wtorch/dataset_toolkit.py +67 -0
  129. wml/wtorch/depthwise_separable_conv_module.py +98 -0
  130. wml/wtorch/dist.py +591 -0
  131. wml/wtorch/dropblock/__init__.py +6 -0
  132. wml/wtorch/dropblock/dropblock.py +228 -0
  133. wml/wtorch/dropblock/dropout.py +40 -0
  134. wml/wtorch/dropblock/scheduler.py +48 -0
  135. wml/wtorch/ema.py +61 -0
  136. wml/wtorch/fc_module.py +73 -0
  137. wml/wtorch/functional.py +34 -0
  138. wml/wtorch/iter_dataset.py +26 -0
  139. wml/wtorch/loss.py +69 -0
  140. wml/wtorch/nets/__init__.py +0 -0
  141. wml/wtorch/nets/ckpt_toolkit.py +219 -0
  142. wml/wtorch/nets/fpn.py +276 -0
  143. wml/wtorch/nets/hrnet/__init__.py +0 -0
  144. wml/wtorch/nets/hrnet/config.py +2 -0
  145. wml/wtorch/nets/hrnet/hrnet.py +494 -0
  146. wml/wtorch/nets/misc.py +249 -0
  147. wml/wtorch/nets/resnet/__init__.py +0 -0
  148. wml/wtorch/nets/resnet/layers/__init__.py +17 -0
  149. wml/wtorch/nets/resnet/layers/aspp.py +144 -0
  150. wml/wtorch/nets/resnet/layers/batch_norm.py +231 -0
  151. wml/wtorch/nets/resnet/layers/blocks.py +111 -0
  152. wml/wtorch/nets/resnet/layers/wrappers.py +110 -0
  153. wml/wtorch/nets/resnet/r50_config.py +38 -0
  154. wml/wtorch/nets/resnet/resnet.py +691 -0
  155. wml/wtorch/nets/shape_spec.py +20 -0
  156. wml/wtorch/nets/simple_fpn.py +101 -0
  157. wml/wtorch/nms.py +109 -0
  158. wml/wtorch/nn.py +896 -0
  159. wml/wtorch/ocr_block.py +193 -0
  160. wml/wtorch/summary.py +331 -0
  161. wml/wtorch/train_toolkit.py +603 -0
  162. wml/wtorch/transformer_blocks.py +266 -0
  163. wml/wtorch/utils.py +719 -0
  164. wml/wtorch/wlr_scheduler.py +100 -0
wml/basic_img_utils.py ADDED
@@ -0,0 +1,816 @@
import copy
import math
import random  # needed by pad_img's RANDOM_PAD mode (was missing -> NameError)
from collections import OrderedDict
# `Iterable` must come from collections.abc: the `collections` alias was
# deprecated in Python 3.3 and removed in Python 3.10.
from collections.abc import Iterable

import cv2
import numpy as np

import wml.walgorithm as wa

# Semicolon-separated list of recognized image file suffixes.
BASE_IMG_SUFFIX = ".jpg;;.jpeg;;.bmp;;.png;;.gif;;.tif"
9
+
10
+
def normal_image(image, min_v=0, max_v=255, dtype=np.uint8):
    """Linearly rescale `image` so its values span [min_v, max_v].

    The input is converted to float32, min/max-normalized (with a 1e-8
    guard against a constant image), then cast to `dtype`.
    """
    image = np.asarray(image)
    if image.dtype != np.float32:
        image = image.astype(np.float32)

    lo = float(np.min(image))
    hi = float(np.max(image))
    scale = float(max_v - min_v) / max(hi - lo, 1e-8)
    image = (image - lo) * scale + float(min_v)

    if dtype != np.float32:
        image = image.astype(dtype)
    return image
28
+
29
+
def _get_translate_matrix(offset, direction='horizontal'):
    """Build a 2x3 affine translation matrix.

    Args:
        offset (int | float): Translation amount in pixels.
        direction (str): 'horizontal' or 'vertical'.

    Returns:
        ndarray: float32 matrix suitable for cv2.warpAffine.
    """
    if direction == 'horizontal':
        matrix = np.float32([[1, 0, offset], [0, 1, 0]])
    elif direction == 'vertical':
        matrix = np.float32([[1, 0, 0], [0, 1, offset]])
    return matrix
46
+
def _get_shear_matrix(magnitude, direction='horizontal'):
    """Build a 2x3 affine shear matrix.

    Args:
        magnitude (int | float): Shear factor.
        direction (str): 'horizontal' or 'vertical'.

    Returns:
        ndarray: float32 matrix suitable for cv2.warpAffine.
    """
    if direction == 'horizontal':
        matrix = np.float32([[1, magnitude, 0], [0, 1, 0]])
    elif direction == 'vertical':
        matrix = np.float32([[1, 0, 0], [magnitude, 1, 0]])
    return matrix
63
+
# Map from human-readable interpolation names to OpenCV interpolation flags,
# used by the im* helpers below (imrotate/imtranslate/imshear/im_warp_affine).
cv2_interp_codes = {
    'nearest': cv2.INTER_NEAREST,
    'bilinear': cv2.INTER_LINEAR,
    'bicubic': cv2.INTER_CUBIC,
    'area': cv2.INTER_AREA,
    'lanczos': cv2.INTER_LANCZOS4
}
71
+
def crop_img_absolute(img, box):
    """Crop img[H,W(,C)] to box = (ymin, xmin, ymax, xmax) in absolute pixels.

    The box is clipped to the image bounds before slicing, so out-of-range
    coordinates are tolerated.
    """
    h, w = img.shape[0], img.shape[1]
    b = np.array(box)
    b[0:4:2] = np.minimum(b[0:4:2], h)  # clip y coords to height
    b[1:4:2] = np.minimum(b[1:4:2], w)  # clip x coords to width
    b = np.maximum(b, 0)
    ymin, xmin, ymax, xmax = b[0], b[1], b[2], b[3]
    if img.ndim == 2:
        return img[ymin:ymax, xmin:xmax]
    return img[ymin:ymax, xmin:xmax, :]
def crop_img_absolute_xy(img, box):
    """Crop img[H,W(,C)] to box = (xmin, ymin, xmax, ymax) in absolute pixels.

    The box is clipped to the image bounds before slicing.
    """
    b = np.array(box)
    b[0:4:2] = np.minimum(b[0:4:2], img.shape[1])  # clip x coords to width
    b[1:4:2] = np.minimum(b[1:4:2], img.shape[0])  # clip y coords to height
    b = np.maximum(b, 0)
    xmin, ymin, xmax, ymax = b[0], b[1], b[2], b[3]
    return img[ymin:ymax, xmin:xmax]
104
+
def crop_img(img, box):
    """Crop img[H,W(,C)] to box = (ymin, xmin, ymax, xmax) in relative [0,1] coords.

    Coordinates are clipped to [0,1]; max edges get a +1 pixel extension,
    matching the original rounding behavior.
    """
    h, w = img.shape[0], img.shape[1]
    b = np.clip(np.array(box), 0.0, 1.0)
    ymin = int(h * b[0] + 0.5)
    ymax = int(h * b[2] + 1.5)
    xmin = int(w * b[1] + 0.5)
    xmax = int(w * b[3] + 1.5)
    if img.ndim == 2:
        return img[ymin:ymax, xmin:xmax]
    return img[ymin:ymax, xmin:xmax, :]
121
+
122
+
def crop_batch_img_absolute_xy(img, box):
    """Crop a batch img[B,C,H,W] to box = (xmin, ymin, xmax, ymax) absolute.

    The box is clipped to the spatial bounds before slicing.
    """
    b = np.array(box)
    b[0:4:2] = np.minimum(b[0:4:2], img.shape[-1])  # clip x to W
    b[1:4:2] = np.minimum(b[1:4:2], img.shape[-2])  # clip y to H
    b = np.maximum(b, 0)
    xmin, ymin, xmax, ymax = b[0], b[1], b[2], b[3]
    return img[:, :, ymin:ymax, xmin:xmax]
138
+
def set_subimg(img, sub_img, p0):
    """Write sub_img into img with its top-left corner at p0 = (x, y).

    Mutates and returns img; the caller must ensure sub_img fits.
    """
    x, y = p0
    h, w = sub_img.shape[0], sub_img.shape[1]
    img[y:y + h, x:x + w] = sub_img
    return img
146
+
def crop_and_pad(img, bbox, size=None, pad_color=127):
    """Crop img to bbox, then pad bottom/right up to size with pad_color.

    Args:
        img: [H,W,C] or [H,W] image.
        bbox: (xmin, ymin, xmax, ymax) absolute coordinates.
        size: (w, h) target size; defaults to the bbox size.
        pad_color: scalar or per-channel iterable fill value.

    Returns:
        The cropped image, padded (top-left anchored) when smaller than size.
    """
    if size is None:
        size = (bbox[2] - bbox[0], bbox[3] - bbox[1])
    img = crop_img_absolute_xy(img, bbox)
    if img.shape[0] >= size[1] and img.shape[1] >= size[0]:
        return img

    if img.ndim == 3:
        channels = img.shape[-1]
        if not isinstance(pad_color, Iterable):
            pad_color = (pad_color,) * channels
        pad_color = np.array(list(pad_color), dtype=img.dtype)
        # BUG FIX: canvas channel count was hard-coded to 3, which broke
        # (or silently broadcast) for images with a different channel count.
        res = np.ones([size[1], size[0], channels], dtype=img.dtype)
        res = res * pad_color.reshape([1, 1, channels])
    else:
        # 2-D images previously crashed (img.shape[-1] was the width).
        fill = pad_color[0] if isinstance(pad_color, Iterable) else pad_color
        res = np.full([size[1], size[0]], fill, dtype=img.dtype)

    h, w = img.shape[0], img.shape[1]
    res[:h, :w] = img
    return res
172
+
def align_pad(img, align=32, value=127):
    """Pad img bottom/right with `value` so H and W are multiples of `align`.

    Args:
        img: [H,W] or [H,W,C] image; channel count is preserved.
        align (int): Alignment multiple.
        value: Fill value for the padded region.

    Returns:
        The padded image (same dtype and channel layout as input).
    """
    out_shape = list(img.shape)
    out_shape[0] = (out_shape[0] + align - 1) // align * align
    out_shape[1] = (out_shape[1] + align - 1) // align * align
    # BUG FIX: the canvas was hard-coded to 3 channels, which silently
    # broadcast 1-channel inputs to 3 channels and crashed on other counts.
    res = np.full(out_shape, value, dtype=img.dtype)
    h, w = img.shape[0], img.shape[1]
    res[:h, :w] = img
    return res
184
+
185
+
def crop_masks_absolute(masks, box):
    """Crop a mask stack masks[N,H,W] to box = (ymin, xmin, ymax, xmax) absolute.

    The box is clipped to the mask bounds before slicing.
    """
    h, w = masks.shape[1], masks.shape[2]
    b = np.array(box)
    b[0:4:2] = np.minimum(b[0:4:2], h)  # clip y to H
    b[1:4:2] = np.minimum(b[1:4:2], w)  # clip x to W
    b = np.maximum(b, 0)
    ymin, xmin, ymax, xmax = b[0], b[1], b[2], b[3]
    return masks[:, ymin:ymax, xmin:xmax]
201
+
def crop_masks_absolute_xy(img, box):
    """Crop masks [NR,H,W] to box = (xmin, ymin, xmax, ymax) absolute.

    Delegates to crop_masks_absolute after swapping to (ymin,xmin,ymax,xmax).
    """
    return crop_masks_absolute(img, [box[1], box[0], box[3], box[2]])
209
+
def sub_image(img, rect, pad_value=127):
    """Crop img[H,W(,C)] to rect = (ymin, xmin, ymax, xmax) absolute.

    Like crop_img, but regions of rect outside the image are filled with
    pad_value (pad first, then crop), so the output always has the full
    rect size.

    Args:
        img: [H,W] or [H,W,C] image.
        rect: (ymin, xmin, ymax, xmax); may extend beyond the image.
        pad_value: Fill value for out-of-image regions.

    Returns:
        A copy of the cropped region.
    """
    # BUG FIX: work on local coordinates instead of mutating the caller's rect.
    ymin, xmin, ymax, xmax = rect[0], rect[1], rect[2], rect[3]
    if ymin < 0 or xmin < 0 or ymax > img.shape[0] or xmax > img.shape[1]:
        py0 = max(-ymin, 0)
        py1 = max(ymax - img.shape[0], 0)
        px0 = max(-xmin, 0)
        px1 = max(xmax - img.shape[1], 0)
        pad = [[py0, py1], [px0, px1]]
        if img.ndim == 3:
            # BUG FIX: the channel pad-pair was added unconditionally, which
            # crashed np.pad for 2-D images.
            pad.append([0, 0])
        img = np.pad(img, pad, constant_values=pad_value)
        ymin += py0
        ymax += py0
        xmin += px0
        xmax += px0

    return copy.deepcopy(img[ymin:ymax, xmin:xmax])
228
+
def sub_images(img, rects):
    """Crop one region per rect from img.

    Args:
        img: [H,W] or [H,W,C] image.
        rects: [N,4] of (ymin, xmin, ymax, xmax) absolute coordinates.

    Returns:
        list of cropped images (see sub_image for padding behavior).
    """
    return [sub_image(img, rect) for rect in rects]
def sub_imagev2(img, rect, pad_value=127):
    """Same as sub_image, but rect is (xmin, ymin, xmax, ymax) absolute."""
    yx_rect = [rect[1], rect[0], rect[3], rect[2]]
    return sub_image(img, yx_rect, pad_value=pad_value)
245
+
def center_crop(img, size, pad_value=127):
    """Crop a size = (w, h) window centered on img[H,W,C].

    Out-of-bounds regions are filled with pad_value (via sub_image).
    """
    cy = img.shape[0] // 2
    cx = img.shape[1] // 2
    x0 = cx - size[0] // 2
    y0 = cy - size[1] // 2
    return sub_image(img, [y0, x0, y0 + size[1], x0 + size[0]], pad_value=pad_value)
258
+
def past_img(dst_img, src_img, pos):
    """Paste src_img into dst_img with its top-left corner at pos = (x, y).

    Args:
        dst_img: [H,W,C] destination (mutated in place).
        src_img: [h,w,C] patch.
        pos: (x, y) top-left corner of the paste region.

    Returns:
        dst_img.
    """
    x, y = pos
    h, w = src_img.shape[0], src_img.shape[1]
    dst_img[y:y + h, x:x + w] = src_img
    return dst_img
268
+
def crop_and_past_img(dst_img, src_img, src_bbox, pos):
    """Crop src_bbox = (xmin, ymin, xmax, ymax) from src_img and paste at pos = (x, y)."""
    patch = crop_img_absolute_xy(src_img, src_bbox)
    return past_img(dst_img, patch, pos)
276
+
def imrotate(img,
             angle,
             center=None,
             scale=1.0,
             border_value=0,
             interpolation='bilinear',
             auto_bound=False):
    """Rotate an image around a center point.

    Args:
        img (ndarray): Image to be rotated.
        angle (float): Rotation in degrees; positive is clockwise.
        center (tuple[float], optional): (w, h) rotation center in the source
            image; defaults to the image center. Incompatible with auto_bound.
        scale (float): Isotropic scale factor.
        border_value (int): Fill value for exposed borders.
        interpolation (str): One of the keys of ``cv2_interp_codes``.
        auto_bound (bool): Grow the output so the whole rotated image fits.

    Returns:
        ndarray: The rotated image.
    """
    if center is not None and auto_bound:
        raise ValueError('`auto_bound` conflicts with `center`')
    h, w = img.shape[:2]
    if center is None:
        center = ((w - 1) * 0.5, (h - 1) * 0.5)
    assert isinstance(center, tuple)

    # cv2 treats positive angles as counter-clockwise, hence -angle.
    matrix = cv2.getRotationMatrix2D(center, -angle, scale)
    if auto_bound:
        cos = np.abs(matrix[0, 0])
        sin = np.abs(matrix[0, 1])
        new_w = h * sin + w * cos
        new_h = h * cos + w * sin
        # Shift so the enlarged canvas stays centered on the content.
        matrix[0, 2] += (new_w - w) * 0.5
        matrix[1, 2] += (new_h - h) * 0.5
        w = int(np.round(new_w))
        h = int(np.round(new_h))
    return cv2.warpAffine(
        img,
        matrix, (w, h),
        flags=cv2_interp_codes[interpolation],
        borderValue=border_value)
325
+
def imtranslate(img,
                offset,
                direction='horizontal',
                border_value=0,
                interpolation='bilinear'):
    """Translate an image along one axis.

    Args:
        img (ndarray): Image of shape (h, w) or (h, w, c).
        offset (int | float): Translation amount in pixels.
        direction (str): 'horizontal' or 'vertical'.
        border_value (int | tuple[int]): Fill value for the exposed border;
            a scalar is broadcast to all channels.
        interpolation (str): One of the keys of ``cv2_interp_codes``.

    Returns:
        ndarray: The translated image.
    """
    assert direction in ['horizontal',
                         'vertical'], f'Invalid direction: {direction}'
    height, width = img.shape[:2]
    if img.ndim == 2:
        channels = 1
    elif img.ndim == 3:
        channels = img.shape[-1]
    if isinstance(border_value, int):
        border_value = (border_value,) * channels
    elif isinstance(border_value, tuple):
        assert len(border_value) == channels, \
            'Expected the num of elements in tuple equals the channels' \
            'of input image. Found {} vs {}'.format(
                len(border_value), channels)
    else:
        raise ValueError(
            f'Invalid type {type(border_value)} for `border_value`.')
    matrix = _get_translate_matrix(offset, direction)
    # cv2.warpAffine raises TypeError when `border_value` has more than
    # a few elements (e.g. masks with many channels), so only the first
    # 3 values are forwarded.
    return cv2.warpAffine(
        img,
        matrix,
        (width, height),
        borderValue=border_value[:3],
        flags=cv2_interp_codes[interpolation])
375
+
def imshear(img,
            magnitude,
            direction='horizontal',
            border_value=0,
            interpolation='bilinear'):
    """Shear an image along one axis.

    Args:
        img (ndarray): Image of shape (h, w) or (h, w, c).
        magnitude (int | float): Shear factor.
        direction (str): 'horizontal' or 'vertical'.
        border_value (int | tuple[int]): Fill value for the exposed border;
            a scalar is broadcast to all channels.
        interpolation (str): One of the keys of ``cv2_interp_codes``.

    Returns:
        ndarray: The sheared image.
    """
    assert direction in ['horizontal',
                         'vertical'], f'Invalid direction: {direction}'
    height, width = img.shape[:2]
    if img.ndim == 2:
        channels = 1
    elif img.ndim == 3:
        channels = img.shape[-1]
    if isinstance(border_value, int):
        border_value = (border_value,) * channels
    elif isinstance(border_value, tuple):
        assert len(border_value) == channels, \
            'Expected the num of elements in tuple equals the channels' \
            'of input image. Found {} vs {}'.format(
                len(border_value), channels)
    else:
        raise ValueError(
            f'Invalid type {type(border_value)} for `border_value`')
    matrix = _get_shear_matrix(magnitude, direction)
    # cv2.warpAffine raises TypeError when `border_value` has more than
    # a few elements (e.g. masks with many channels), so only the first
    # 3 values are forwarded.
    return cv2.warpAffine(
        img,
        matrix,
        (width, height),
        borderValue=border_value[:3],
        flags=cv2_interp_codes[interpolation])
425
+
def im_warp_affine(img,
                   M,
                   border_value=0,
                   interpolation='bilinear',
                   out_shape=None,
                   ):
    """Apply a 2x3 affine matrix M to img.

    Args:
        out_shape: (W, H) output size; defaults to the input size.
    """
    if out_shape is None:
        out_shape = (img.shape[1], img.shape[0])
    return cv2.warpAffine(
        img,
        M, out_shape,
        flags=cv2_interp_codes[interpolation],
        borderValue=border_value)
444
+
def imflip(img, direction='horizontal'):
    """Flip an image.

    Args:
        img (ndarray): Image to be flipped.
        direction (str): 'horizontal' (mirror left/right), 'vertical'
            (mirror top/bottom) or 'diagonal' (both).

    Returns:
        ndarray: The flipped image (a numpy view).
    """
    assert direction in ['horizontal', 'vertical', 'diagonal']
    axis = {'horizontal': 1, 'vertical': 0, 'diagonal': (0, 1)}[direction]
    return np.flip(img, axis=axis)
463
+
464
+
def resize_img(img, size, keep_aspect_ratio=False, interpolation=cv2.INTER_LINEAR, align=None):
    """Resize img[H,W(,C)] to size = (w, h).

    Args:
        img: Input image.
        size: (w, h) target size.
        keep_aspect_ratio: If True, shrink the target so the aspect ratio is
            preserved; the result fits inside `size`.
        interpolation: cv2 interpolation flag.
        align: If set, round the target dims up to a multiple of `align`.

    Returns:
        The resized image; a trailing singleton channel dim is preserved.
    """
    img_shape = img.shape
    if size[0] == img.shape[1] and size[1] == img.shape[0]:
        return img

    # Degenerate (zero-sized) input: return an all-zero image of target size.
    if np.any(np.array(img_shape) == 0):
        img_shape = list(img_shape)
        img_shape[0] = size[1]
        img_shape[1] = size[0]
        return np.zeros(img_shape, dtype=img.dtype)

    if keep_aspect_ratio:
        # Aspect preserved iff h*W == w*H; otherwise scale by the tighter side.
        if size[1] * img_shape[1] != size[0] * img_shape[0]:
            if size[1] * img_shape[1] > size[0] * img_shape[0]:
                ratio = size[0] / img_shape[1]
            else:
                ratio = size[1] / img_shape[0]
            size = list(copy.deepcopy(size))
            size[0] = int(img_shape[1] * ratio)
            size[1] = int(img_shape[0] * ratio)

    if align:
        # BUG FIX: `size` may still be a tuple here; item assignment on a
        # tuple raised TypeError. Convert to a list first.
        size = list(size)
        size[0] = (size[0] + align - 1) // align * align
        size[1] = (size[1] + align - 1) // align * align

    if not isinstance(size, tuple):
        size = tuple(size)
    # BUG FIX: compare (w, h) against (W, H). The original compared
    # size[0]==img_shape[0] (w vs H), skipping the resize for transposed sizes.
    if size[0] == img_shape[1] and size[1] == img_shape[0]:
        return img

    img = cv2.resize(img, dsize=size, interpolation=interpolation)

    # cv2.resize drops a trailing singleton channel dim; restore it.
    if len(img_shape) == 3 and len(img.shape) == 2:
        img = np.expand_dims(img, axis=-1)

    return img
506
+
def resize_imgv2(img, size, interpolation=cv2.INTER_LINEAR, return_scale=False, align=None):
    """Aspect-preserving resize to fit size = (w, h).

    Optionally pads to an `align` multiple and returns the height scale
    (new_height / old_height) when return_scale is True.
    """
    old_h = img.shape[0]
    img = resize_img(img, size, keep_aspect_ratio=True, interpolation=interpolation)
    scale = img.shape[0] / max(old_h, 1)

    if align is not None:
        img = align_pad(img, align=align)

    if return_scale:
        return img, scale
    return img
524
+
def resize_imgv3(img, size, interpolation=cv2.INTER_LINEAR, return_scale=False, align=None, keep_aspect_ratio=True):
    """Resize to size = (w, h), optionally preserving aspect ratio.

    When return_scale is True, also returns the (w, h) scale tuple
    (new/old, computed before any align padding).
    """
    src_shape = img.shape
    img = resize_img(img, size, keep_aspect_ratio=keep_aspect_ratio, interpolation=interpolation)
    scale = (img.shape[1] / max(src_shape[1], 1),
             img.shape[0] / max(src_shape[0], 1))

    if align is not None:
        img = align_pad(img, align=align)

    if return_scale:
        return img, scale
    return img
542
+
def resize_height(img, h, interpolation=cv2.INTER_LINEAR):
    """Resize img to height h, keeping the aspect ratio."""
    new_w = int(img.shape[1] * h / img.shape[0])
    return cv2.resize(img, dsize=(new_w, h), interpolation=interpolation)
548
+
def resize_width(img, w, interpolation=cv2.INTER_LINEAR):
    """Resize img to width w, keeping the aspect ratio."""
    new_h = int(img.shape[0] * w / img.shape[1])
    return cv2.resize(img, dsize=(w, new_h), interpolation=interpolation)
554
+
def resize_short_size(img, size, interpolation=cv2.INTER_LINEAR):
    """Resize so the shorter side equals `size`, keeping aspect ratio."""
    if img.shape[0] < img.shape[1]:
        return resize_height(img, size, interpolation)
    return resize_width(img, size, interpolation)
561
+
def resize_long_size(img, size, interpolation=cv2.INTER_LINEAR):
    """Resize so the longer side equals `size`, keeping aspect ratio."""
    if img.shape[0] > img.shape[1]:
        return resize_height(img, size, interpolation)
    return resize_width(img, size, interpolation)
def resize_and_pad(img, size, interpolation=cv2.INTER_LINEAR, pad_color=(0, 0, 0), center_pad=True, return_scale=False):
    """Aspect-preserving resize to fit size = (w, h), then pad to exactly size.

    Args:
        img: [H,W] or [H,W,C] image.
        size: (w, h) target size.
        pad_color: scalar or per-channel fill value for the padded area.
        center_pad: center the resized image on the canvas; otherwise top-left.
        return_scale: also return r = new_height / old_height.

    Returns:
        Padded image, or (image, r) when return_scale is True.
    """
    old_h = img.shape[0]
    img = resize_img(img, size, keep_aspect_ratio=True, interpolation=interpolation)
    r = img.shape[0] / max(old_h, 1)

    if img.shape[0] == size[1] and img.shape[1] == size[0]:
        return (img, r) if return_scale else img

    if img.ndim == 3:
        channels = img.shape[-1]
        if not isinstance(pad_color, Iterable):
            pad_color = [pad_color] * channels
        canvas = np.ones([size[1], size[0], channels], dtype=img.dtype)
        fill = np.array(list(pad_color), dtype=img.dtype).reshape([1, 1, channels])
    else:
        if not isinstance(pad_color, Iterable):
            pad_color = [pad_color]
        canvas = np.ones([size[1], size[0]], dtype=img.dtype)
        fill = np.array(list(pad_color), dtype=img.dtype).reshape([1, 1])
    canvas = canvas * fill

    if center_pad:
        ox = (size[0] - img.shape[1]) // 2
        oy = (size[1] - img.shape[0]) // 2
    else:
        ox = 0
        oy = 0

    h, w = img.shape[0], img.shape[1]
    canvas[oy:oy + h, ox:ox + w] = img

    return (canvas, r) if return_scale else canvas
612
+
def rotate_img(img, angle, scale=1.0, border_value=0, dsize=None, center=None, interpolation=cv2.INTER_LINEAR):
    """Rotate img by `angle` degrees around `center` (defaults to image center).

    When dsize = (w, h) is given, the rotation is re-centered into the
    output frame via wml.walgorithm.getRotationMatrix2D.
    """
    if center is None:
        center = (img.shape[1] // 2, img.shape[0] // 2)
    if dsize is None:
        dsize = (img.shape[1], img.shape[0])
        M = cv2.getRotationMatrix2D(center, angle, scale)
    else:
        M = wa.getRotationMatrix2D(center, angle, scale, out_offset=(dsize[0] // 2, dsize[1] // 2))
    return cv2.warpAffine(img, M, dsize, borderValue=border_value, flags=interpolation)
623
+
def rotate_img_file(filepath, angle, scale=1.0):
    """Rotate the image stored at filepath in place (overwrites the file)."""
    img = cv2.imread(filepath)
    h, w = img.shape[:2]
    M = cv2.getRotationMatrix2D((w // 2, h // 2), angle, scale)
    cv2.imwrite(filepath, cv2.warpAffine(img, M, (w, h)))
630
+
def crop_and_resize(img, box, crop_size):
    """Crop box = (ymin, xmin, ymax, xmax) relative coords, then resize.

    NOTE(review): the original comment said crop_size is [height, width],
    but resize_img expects (w, h) — confirm against callers.
    """
    return resize_img(crop_img(img, box), crop_size)
638
+
def crop_and_resize_imgs(img, boxes, crop_size):
    """Crop several relative boxes [N,4] (ymin,xmin,ymax,xmax) from one image.

    Each crop is resized to crop_size; results are stacked along axis 0.
    """
    crops = [crop_and_resize(img, box, crop_size) for box in boxes]
    return np.stack(crops, axis=0)
def one_to_one_crop_and_resize_imgs(imgs, boxes, crop_size):
    """Crop boxes[i] from imgs[i] (relative ymin,xmin,ymax,xmax) and resize.

    Returns an array of shape [N] + crop_size.
    """
    crops = [crop_and_resize(img, box, crop_size) for img, box in zip(imgs, boxes)]
    return np.stack(crops, axis=0)
665
+
666
+
667
+
668
+
669
+
# Padding placement modes for pad_img.
CENTER_PAD = 0
RANDOM_PAD = 1
TOPLEFT_PAD = 2
def pad_img(img, size, pad_value=127, pad_type=CENTER_PAD, return_pad_value=False):
    """Pad img[H,W(,C)] with pad_value up to size = (w, h).

    Args:
        img: Input image; dimensions already >= size are left unpadded.
        size: (w, h) minimum output size.
        pad_value: Fill value.
        pad_type: CENTER_PAD, RANDOM_PAD or TOPLEFT_PAD placement.
        return_pad_value: Also return the margins (px0, px1, py0, py1).

    Returns:
        Padded image, or (img, px0, px1, py0, py1) when return_pad_value.

    Raises:
        ValueError: For an unknown pad_type (previously a NameError).
    """
    # Local import: the module never imported `random`, so RANDOM_PAD
    # raised NameError at runtime.
    import random

    dy = max(size[1] - img.shape[0], 0)
    dx = max(size[0] - img.shape[1], 0)
    if pad_type == CENTER_PAD:
        py0 = dy // 2
        px0 = dx // 2
    elif pad_type == RANDOM_PAD:
        py0 = random.randint(0, dy)
        px0 = random.randint(0, dx)
    elif pad_type == TOPLEFT_PAD:
        py0 = 0
        px0 = 0
    else:
        raise ValueError(f"unknown pad_type {pad_type}")
    py1 = dy - py0
    px1 = dx - px0

    if img.ndim == 3:
        img = np.pad(img, [[py0, py1], [px0, px1], [0, 0]], constant_values=pad_value)
    else:
        img = np.pad(img, [[py0, py1], [px0, px1]], constant_values=pad_value)

    if return_pad_value:
        return img, px0, px1, py0, py1
    return img
731
+
'''
img:[H,W,C]
size:(w,h)
'''
# NOTE(review): this definition is DEAD CODE — a second `pad_imgv2` with a
# different signature is defined later in this module and shadows this one
# at import time. Rename one of the two (e.g. this one to `pad_img_to_size`)
# to make this variant reachable.
def pad_imgv2(img,size,pad_color=(0,0,0),center_pad=False):
    # Already at the target size: nothing to do.
    if img.shape[0] == size[1] and img.shape[1] == size[0]:
        return img
    else:
        # Canvas filled with pad_color; assumes a 3-channel image — TODO confirm.
        res = np.ones([size[1],size[0],3],dtype=img.dtype)
        pad_color = np.array(list(pad_color),dtype=img.dtype)
        pad_color = pad_color.reshape([1,1,3])
        res = res*pad_color
        if center_pad:
            # Center the image on the canvas.
            offset_x = (size[0]-img.shape[1])//2
            offset_y = (size[1]-img.shape[0])//2
        else:
            # Top-left anchored.
            offset_x = 0
            offset_y = 0

        w = img.shape[1]
        h = img.shape[0]
        res[offset_y:offset_y+h,offset_x:offset_x+w,:] = img
        return res
755
+
def pad_imgv2(img, px0, px1, py0, py1, pad_value=127):
    """Pad img[H,W(,C)] with explicit margins.

    px0/px1 pad left/right, py0/py1 pad top/bottom; filled with pad_value.
    """
    pads = [[py0, py1], [px0, px1]]
    if img.ndim == 3:
        pads.append([0, 0])
    return np.pad(img, pads, constant_values=pad_value)
763
+
def sub_imagesv2(img, rects):
    """Crop one region per rect from img.

    Args:
        img: [H,W] or [H,W,C] image.
        rects: [N,4] of (xmin, ymin, xmax, ymax) absolute coordinates.

    Returns:
        list of cropped images (see sub_imagev2 for padding behavior).
    """
    return [sub_imagev2(img, rect) for rect in rects]
774
+
def __get_discrete_palette(palette=[(0,(0,0,255)),(0.5,(255,255,255)),(1.0,(255,0,0))],nr=1000):
    """Expand sparse (position, color) stops into `nr` interpolated colors.

    Positions are in [0,1]; colors are linearly interpolated between
    consecutive stops. Returns a uint8 lookup table of shape [nr, 3].
    """
    lut = np.zeros([nr, 3], dtype=np.float32)
    prev_stop = palette[0]
    for stop in palette[1:]:
        end_idx = min(math.ceil(stop[0] * nr), nr)
        beg_idx = min(max(math.floor(prev_stop[0] * nr), 0), end_idx)
        c0 = np.array(prev_stop[1], dtype=np.float32)
        c1 = np.array(stop[1], dtype=np.float32)
        for i in range(beg_idx, end_idx):
            lut[i] = (i - beg_idx) * (c1 - c0) / (end_idx - beg_idx) + c0
        prev_stop = stop

    return np.clip(lut, 0, 255).astype(np.uint8)
793
+
def __get_discrete_img(img, nr=1000):
    """Quantize a float image in [0,1] to int32 bin indices in [0, nr-1]."""
    scaled = img.astype(np.float32) * (nr - 1)
    return np.clip(scaled, 0, nr - 1).astype(np.int32)
799
+
800
+
def pseudocolor_img(img, palette=[(0,(0,0,255)),(0.5,(255,255,255)),(1.0,(255,0,0))], auto_norm=True):
    """Map a single-channel image (H, W) to a pseudocolor image (H, W, 3).

    Values are expected in [0,1] unless auto_norm is True, in which case
    the image is min/max-normalized first. Colors come from `palette`.
    """
    if auto_norm:
        img = normal_image(img, 0.0, 1.0, dtype=np.float32)
    color_nr = 256
    idx = __get_discrete_img(img, nr=color_nr)
    lut = __get_discrete_palette(palette, nr=color_nr)
    h, w = idx.shape
    flat = np.reshape(idx, [-1])
    return np.reshape(lut[flat], [h, w, 3])
816
+