Python 基于自定义数据集的PyTorch图像分类_Python_Pytorch

Python 基于自定义数据集的PyTorch图像分类

python pytorch

Python 基于自定义数据集的PyTorch图像分类,python,pytorch,Python,Pytorch,在人工智能和神经网络方面，我仍然是一个初学者，在学习的过程中，我试图做一些例子，但我有一个问题，不知道如何解决它。如果你们中有人能帮助我，我将非常感激我想做什么？使用PyTorch和一些自定义数据集对10种动物进行简单的图像分类我的图像每个图像的形状为（3200200）此外，我在每个文件夹上都有大约40个图像（训练和测试）我的数据文件夹看起来怎么样？训练猫狗老鼠试验猫狗老鼠我的型号 class NetModel(nn.Module): def

在人工智能和神经网络方面，我仍然是一个初学者，在学习的过程中，我试图做一些例子，但我有一个问题，不知道如何解决它。如果你们中有人能帮助我，我将非常感激

我想做什么？

使用PyTorch和一些自定义数据集对10种动物进行简单的图像分类

我的图像

每个图像的形状为（3200200）

此外，我在每个文件夹上都有大约40个图像（训练和测试）

我的数据文件夹看起来怎么样？

训练
- 猫
- 狗
- 老鼠
试验
- 猫
- 狗
- 老鼠

我的型号

class NetModel(nn.Module):
    def __init__(self):
        super(NetModel, self).__init__()
        self.conv1 = nn.Conv2d(3, 6, 5)
        self.pool = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(6, 16, 5)
        self.fc1 = nn.Linear(16 * 5 * 5, 120)
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, 10)

    def forward(self, x):
        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        x = x.view(-1, 16 * 5 * 5)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        x = self.fc3(x)
        return x


def train_model(model, train_loader, optimizer, criterion, epochs, save_path):
    for epoch in range(epochs):  # loop over the dataset multiple times
        running_loss = 0.0
        for i, data in enumerate(train_loader, 0):
            # get the inputs; data is a list of [inputs, labels]
            inputs, labels = data
            # zero the parameter gradients
            optimizer.zero_grad()

            # forward + backward + optimize
            outputs = model(inputs)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()

            # print statistics
            running_loss += loss.item()
            if i % 2000 == 1999:  # print every 2000 mini-batches
                print('[%d, %5d] loss: %.3f' %
                      (epoch + 1, i + 1, running_loss / 2000))
                running_loss = 0.0
    print('Finished Training')
    # PATH = './cifar_net.pth'
    torch.save(model.state_dict(), save_path)
    print('Saved in: {}'.format(save_path))


def test(model, test_loader, classes, saved_path):
    model.load_state_dict(torch.load(saved_path))

    dataiter = iter(test_loader)
    images, labels = dataiter.next()

    print('GroundTruth: ', ' '.join('%5s' % classes[labels[j]] for j in range(4)))

    outputs = model(images)

    _, predicted = torch.max(outputs, 1)

    print('Predicted: ', ' '.join('%5s' % classes[predicted[j]] for j in range(4)))


transform = transforms.Compose(
    [transforms.ToTensor(),
     transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])

charset = string.ascii_letters + "-' "
trainset = TESNamesDataset('../data/train', charset, 10)
testset = TESNamesDataset('../data/test', charset, 10)


trainloader = torch.utils.data.DataLoader(trainset, batch_size=4,
                                          shuffle=True, num_workers=2)

testloader = torch.utils.data.DataLoader(testset, batch_size=4,
                                         shuffle=False, num_workers=2)

model = NetModel()

criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(model.parameters(), lr=0.001, momentum=0.9)

path = "../check_point/saved_model.pth"
train_model(model, trainloader, optimizer, criterion, 100, path)
test(model, testloader, animals, path)

我的自定义数据集

class TESNamesDataset(Dataset):
    def __init__(self, data_root, charset, length):
        self.data_root = data_root
        self.charset = charset + '\0'
        self.length = length
        self.samples = []
        self.char_codec = LabelEncoder()
        self._init_dataset()

    def __len__(self):
        return len(self.samples)

    def __getitem__(self, idx):
        name, pixels = self.samples[idx]
        return self.one_hot_sample(name), pixels

    def _init_dataset(self):
        names = set()
        # self.samples = []
        for animal in os.listdir(self.data_root):
            animal_filepath = os.path.join(self.data_root, animal)
            names.add(animal)
            for img_name in os.listdir(animal_filepath):
                img_path = os.path.join(animal_filepath, img_name)
                im = cv2.imread(img_path)
                if len(animal) < self.length:
                    animal += '\0' * (self.length - len(animal))
                else:
                    animal = animal[:self.length - 1] + '\0'
                self.samples.append((animal, im))

        self.char_codec.fit(list(self.charset))

    def to_one_hot(self, codec, values):
        value_idxs = codec.transform(values)
        return torch.eye(len(codec.classes_))[value_idxs]

    def one_hot_sample(self, name):
        t_name = self.to_one_hot(self.char_codec, list(name))
        return t_name

类数据集（数据集）：
def uuu init uuuu（self，data_root，字符集，长度）：
self.data\u root=数据\u root
self.charset=charset+'\0'
self.length=长度
self.samples=[]
self.char\u codec=LabelEncoder（）
self.\u init\u数据集（）
定义（自我）：
返回透镜（自采样）
def uu getitem uu（self，idx）：
名称，像素=self.samples[idx]
返回self.one_hot_样本（名称），像素
定义初始数据集（自）：
名称=集合（）
#self.samples=[]
对于os.listdir（self.data_root）中的动物：
animal\u filepath=os.path.join（self.data\u root，animal）
名称。添加（动物）
对于os.listdir（动物文件路径）中的img_名称：
img\u path=os.path.join（animal\u filepath，img\u name）
im=cv2.imread（img\u路径）
如果len（动物）<自身长度：
动物+='\0'*（self.length-len（动物））
其他：
动物=动物[：self.length-1]+“\0”
self.samples.append（（动物，im））
self.char\u codec.fit（list（self.charset））
def至_one_hot（自身、编解码器、值）：
value_idxs=codec.transform（值）
return torch.eye（len（codec.classes）[value]
def one溳hot潌潌悻悻悻悻悻悻
t_name=self.to_one_hot（self.char_编解码器，列表（名称））
返回t_名称

错误消息

运行时错误：四维权重6的预期四维输入 35，但得到了大小为[4,10,56]的三维输入

你们谁能告诉我我做错了什么？如果这个问题是离题的，请告诉我在哪里可以提问

谢谢