numpy + plt + cv2 图像切片成 patches

作者: 谢小帅 | 来源:发表于2019-03-17 13:50 被阅读0次

将图像切分为图像块，并复原 - 知乎

起因：为了将场景分割并行化，考虑将原始图片切分成小的 patches，不同 patch 之间没有 overlap 区域，如下图，模型可以并行 12 份处理原始图片。

cut_img.py

用 plt 和 cv2 分别实现，plt 白边太大不美观，cv2 较好。

import skimage.io
import skimage.transform
import numpy as np
import matplotlib.pyplot as plt
import cv2


def cut_patches(img, patch_size, stride_x, stride_y):
    """
    cut one img into sub imgs with patch_size
    :param img: src img
    :param patch_size: sub img size, eg (160, 160) h, w
    :param stride_x: stride along x axis, eg 160
    :param stride_y: stride along y axis, eg 160
    :return: res: np.(patches_num, patch_w, patch_h, channels)
    """
    assert isinstance(patch_size, tuple) and len(patch_size) == 2
    img_h, img_w = img.shape[0], img.shape[1]
    # begin (x,y) left_top
    range_x = np.arange(0, img_w - patch_size[0], step=stride_x)
    range_y = np.arange(0, img_h - patch_size[1], step=stride_y)

    if range_x[-1] < img_w - patch_size[0]:  # stride 可能使得 arange 不能取到最右点，补充1个
        range_x = np.append(range_x, img_w - patch_size[0])
    if range_y[-1] < img_h - patch_size[1]:
        range_y = np.append(range_y, img_h - patch_size[1])

    patches = len(range_x) * len(range_y)  # sub imgs num

    res = None
    if len(img.shape) == 2:
        res = np.zeros((patches, patch_size[0], patch_size[1]))
    if len(img.shape) == 3:
        res = np.zeros((patches, patch_size[0], patch_size[1], img.shape[2]))

    index = 0
    for y in range_y:
        for x in range_x:
            patch = img[y:y + patch_size[1], x:x + patch_size[0]]
            res[index] = patch
            index += 1
    return res


# plt 做出图片还是有很大的白色 board
def plt_patches(img_patches, patch_size, img_size):
    patches_num = img_patches.shape[0]
    rows = int(img_size[0] / patch_size[0])
    cols = int(img_size[1] / patch_size[1])

    # plt 作图需要 img val [0,1]
    divider = 255  # rgb
    if len(img_patches.shape) == 3:  # gray
        divider = 65535

    for i in range(patches_num):
        plt.subplot(rows, cols, i + 1)
        plt.imshow(img_patches[i] / divider)
        plt.axis('off')
    plt.subplots_adjust(wspace=0.02, hspace=0.02)
    plt.show()


# space 精确控制 patches 边界
def cv2_patches(img_patches, patch_size, img_size, space, filename):  # space 两个 patch 之间的像素数
    rows = int(img_size[0] / patch_size[0])
    cols = int(img_size[1] / patch_size[1])

    res = None
    res_h = img_size[0] + (rows - 1) * space
    res_w = img_size[1] + (cols - 1) * space

    if len(img_patches.shape) == 3:  # gray
        res = 65535 * np.ones((res_h, res_w)).astype(np.uint16)  # 先置为全白，再填充
    if len(img_patches.shape) == 4:  # rgb
        res = 255 * np.ones((res_h, res_w, 3)).astype(np.uint8)

    index = 0
    for i in range(rows):
        for j in range(cols):
            begin_h = (patch_size[0] + space) * i
            begin_w = (patch_size[1] + space) * j
            res[begin_h:begin_h + patch_size[0], begin_w:begin_w + patch_size[1]] = img_patches[index]
            index += 1

    if len(img_patches.shape) == 4:
        res = cv2.cvtColor(res, cv2.COLOR_RGB2BGR)
    cv2.imwrite(filename, res)


def test_plt():
    img_size = (480, 640)
    # read
    rgb = skimage.io.imread('rgb.jpg')
    depth = skimage.io.imread('depth.png')
    label = skimage.io.imread('label.png')
    # transform
    rgb = skimage.transform.resize(rgb, img_size,
                                   order=1, mode='reflect', preserve_range=True, anti_aliasing=True)
    depth = skimage.transform.resize(depth, img_size,
                                     order=0, mode='reflect', preserve_range=True, anti_aliasing=True)
    label = skimage.transform.resize(label, img_size,
                                     order=0, mode='reflect', preserve_range=True, anti_aliasing=True)

    patch_size = (160, 160)

    rgb_patches = cut_patches(rgb, patch_size, stride_x=patch_size[1], stride_y=patch_size[0])
    plt_patches(rgb_patches, patch_size, img_size)

    depth_patches = cut_patches(depth, patch_size, stride_x=patch_size[1], stride_y=patch_size[0])
    plt_patches(depth_patches, patch_size, img_size)

    label_patches = cut_patches(label, patch_size, stride_x=patch_size[1], stride_y=patch_size[0])
    plt_patches(label_patches, patch_size, img_size)


def test_cv2():
    img_size = (480, 640)
    # read
    rgb = skimage.io.imread('rgb.jpg')
    depth = skimage.io.imread('depth.png')
    label = skimage.io.imread('label.png')
    # transform
    rgb = skimage.transform.resize(rgb, img_size,
                                   order=1, mode='reflect', preserve_range=True, anti_aliasing=True)
    depth = skimage.transform.resize(depth, img_size,
                                     order=0, mode='reflect', preserve_range=True, anti_aliasing=True)
    label = skimage.transform.resize(label, img_size,
                                     order=0, mode='reflect', preserve_range=True, anti_aliasing=True)

    patch_size = (160, 160)

    rgb_patches = cut_patches(rgb, patch_size, stride_x=patch_size[1], stride_y=patch_size[0])
    cv2_patches(rgb_patches, patch_size, img_size, space=5, filename='rgb_patches.jpg')

    depth_patches = cut_patches(depth, patch_size, stride_x=patch_size[1], stride_y=patch_size[0])
    cv2_patches(depth_patches, patch_size, img_size, space=5, filename='depth_patches.png')

    label_patches = cut_patches(label, patch_size, stride_x=patch_size[1], stride_y=patch_size[0])
    cv2_patches(label_patches, patch_size, img_size, space=5, filename='label_patches.png')


if __name__ == '__main__':
    test_cv2()

网友评论

本文标题：numpy + plt + cv2 图像切片成 patches

本文链接：https://www.haomeiwen.com/subject/nvcumqtx.html

延伸阅读

深度阅读

您也可以注册成为美文阅读网的作者，发表您的原创作品、分享您的心情！

numpy + plt + cv2 图像切片成 patches

相关文章

网友评论

延伸阅读

深度阅读

栏目导航

热点阅读