天天看點

pytorch入門08--資料集轉換 transform

#資料集轉換 transform
import torch
import torchvision
from torch.utils.data import Dataset
import numpy as np


class WineDataset(Dataset):

    def __init__(self, transform=None):
        xy = np.loadtxt('./wine.csv', delimiter=',', dtype=np.float32, skiprows=1)
        self.n_samples = xy.shape[0]

        # note that we do not convert to tensor here
        self.x_data = xy[:, 1:]
        self.y_data = xy[:, [0]]
        self.transform = transform

    def __getitem__(self, index):  #用來擷取一些索引的資料,使dataset[i]傳回資料集中第i個樣本。
        sample = self.x_data[index], self.y_data[index]
        if self.transform:
            sample = self.transform(sample)
        return sample

    def __len__(self):   #實作len(dataset)傳回整個資料集的大小
        return self.n_samples

# Custom Transforms
# implement __call__(self, sample)
class ToTensor:
    # Convert ndarrays to Tensors  調用父類參數,無需再初始化 傳入參數
    def __call__(self, sample):
        inputs, targets = sample
        return torch.from_numpy(inputs), torch.from_numpy(targets)

class MulTransform:
    # multiply inputs with a given factor
    def __init__(self, factor):   #需要傳入參數factor,需要init初始化
        self.factor = factor

    def __call__(self, sample):
        inputs, targets = sample
        inputs *= self.factor
        return inputs, targets

print('Without Transform')
dataset = WineDataset()
first_data = dataset[0]
features, labels = first_data
print(type(features), type(labels))
print(features, labels)

print('\nWith Tensor Transform')
dataset = WineDataset(transform=ToTensor()) #擷取酒類資料集,并用transform調用前面定義好的ToTensor轉換類型
first_data = dataset[0]     #擷取第一行資料
features, labels = first_data  #将第一行的特征賦予features,将第一韓的标簽賦予labels
print(type(features), type(labels)) #列印類型 主要看是否轉化為了tensor類型
print(features, labels)

print('\nWith Tensor and Multiplication Transform')
#torchvision.transforms.Compose組合變換連續一起操作
composed = torchvision.transforms.Compose([ToTensor(), MulTransform(4)])  #同時使用多個轉換
dataset = WineDataset(transform=composed)
first_data = dataset[0]
features, labels = first_data
print(type(features), type(labels))
print(features, labels)