pytorch学习(二十三)—torchvision加载VOC

作者: 侠之大者_7d3f | 来源:发表于2019-01-17 20:56 被阅读2次

pytorch学习(二十三)—torchvision加载VOC
pytorch学习第一天
【深度学习DL-PyTorch】七、加载图像数据(Loading
Linux安装Pytorch+torchvision+torch
在本机一键搞定COCO和VOC数据集
torchvision指南
PASCAL VOC 数据集格式
Pytorch学习记录-使用Pytorch进行深度学习，数据加载
TorchVision
TorchVision

image.png

代码

import torchvision.datasets as datasets
import torchvision
import torch
import numpy as np
import cv2


def show_object_rect(image: np.ndarray, bndbox):
    """Draw a bounding-box outline on ``image`` and return the result.

    The rectangle is drawn directly on ``image`` (no copy is made), using
    the colour tuple ``(0, 255, 255)`` and a line thickness of 2.

    Args:
        image: Image array to draw on; it is modified in place.
        bndbox: Sequence ``(x_min, y_min, x_max, y_max)``. The first two
            values are the top-left corner, the remaining values the
            bottom-right corner.

    Returns:
        Whatever ``cv2.rectangle`` returns for the drawn-on image.
    """
    # OpenCV expects each corner as a tuple of plain ints; coercing here
    # lets callers pass lists or numpy integer arrays as well as tuples.
    pt1 = tuple(int(v) for v in bndbox[:2])
    pt2 = tuple(int(v) for v in bndbox[2:])
    return cv2.rectangle(image, pt1, pt2, (0, 255, 255), 2)


def show_object_name(image: np.ndarray, name: str, p_tl):
    """Write the label ``name`` onto ``image`` at position ``p_tl``.

    Args:
        image: Image array handed to ``cv2.putText``.
        name: Text to render.
        p_tl: Anchor point for the text, passed through to OpenCV as-is.

    Returns:
        Whatever ``cv2.putText`` returns for the annotated image.
    """
    font_face = 1  # numeric font id forwarded to cv2.putText
    font_scale = 1
    text_color = (255, 0, 0)
    annotated = cv2.putText(image, name, p_tl, font_face, font_scale, text_color)
    return annotated


# Open the PASCAL VOC 2012 detection dataset ('train' split) from a local
# directory; download=False means the files must already be present there.
voc_trainset = datasets.VOCDetection('/media/weipenghui/Extra/VOC/VOC_Detection_2012',year='2012', image_set='train', download=False)

print('-'*40)
# The split loaded above is 'train', so the banner names that split.
print('VOC2012-train')
print(len(voc_trainset))

# Walk through every sample, draw each annotated object's box and class
# name on the image, and show it until a key is pressed.
for i, sample in enumerate(voc_trainset, 1):
    image, annotation = sample[0], sample[1]['annotation']
    objects = annotation['object']
    # A single annotated object may arrive as one dict instead of a list.
    # Normalise to a list so the count below is the number of objects (not
    # the number of keys in the dict) and one loop handles both shapes.
    if not isinstance(objects, list):
        objects = [objects]
    print('{} object:{}'.format(i, len(objects)))

    # torchvision hands back an RGB image, while cv2.imshow interprets the
    # array as BGR; convert so the colours are displayed correctly.
    show_image = cv2.cvtColor(np.array(image), cv2.COLOR_RGB2BGR)

    for obj in objects:
        object_name = obj['name']
        object_bndbox = obj['bndbox']
        # Coordinates are converted with int() before being used as pixels.
        x_min = int(object_bndbox['xmin'])
        y_min = int(object_bndbox['ymin'])
        x_max = int(object_bndbox['xmax'])
        y_max = int(object_bndbox['ymax'])
        show_image = show_object_rect(show_image, (x_min, y_min, x_max, y_max))
        show_image = show_object_name(show_image, object_name, (x_min, y_min))

    cv2.imshow('image', show_image)
    # Block until a key is pressed before moving on to the next sample.
    cv2.waitKey(0)


print(voc_trainset)
print('Down load ok')