以下是一個簡單的示例,展示了如何使用 PyTorch 處理自定義圖像分類數據集:
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms
from torch.utils.data import DataLoader
from torchvision.datasets import ImageFolder# 數據預處理
# Preprocessing pipeline: resize every image to 64x64, convert it to a tensor,
# then normalize each of the three channels with mean 0.5 and std 0.5.
transform = transforms.Compose(
    [
        transforms.Resize((64, 64)),
        transforms.ToTensor(),
        transforms.Normalize(mean=(0.5, 0.5, 0.5), std=(0.5, 0.5, 0.5)),
    ]
)

# Build the ImageFolder dataset; replace the placeholder path with the real
# dataset root before running.
train_dataset = ImageFolder('path/to/dataset', transform=transform)

# Wrap the dataset in a shuffling loader that yields mini-batches.
batch_size = 64
data_loader = DataLoader(
    dataset=train_dataset,
    batch_size=batch_size,
    shuffle=True,
)

# Define a simple convolutional neural network model
class SimpleCNN(nn.Module):
    """Minimal CNN classifier: conv -> ReLU -> 2x2 max-pool -> two linear layers.

    The first linear layer is sized for 32 feature maps of 32x32, i.e. it
    expects 3-channel 64x64 inputs (the size the script's preprocessing
    resizes images to).

    Args:
        num_classes: Number of output logits. When omitted (``None``), the
            value is taken from ``len(train_dataset.classes)`` of the
            module-level dataset, preserving the original behaviour of
            ``SimpleCNN()``.
    """

    def __init__(self, num_classes=None):
        super().__init__()
        if num_classes is None:
            # Backward-compatible default: size the output layer from the
            # module-level dataset so it follows the number of classes found.
            num_classes = len(train_dataset.classes)

        self.conv1 = nn.Conv2d(3, 32, kernel_size=3, padding=1)
        self.relu = nn.ReLU()
        self.pool = nn.MaxPool2d(kernel_size=2, stride=2)
        self.flatten = nn.Flatten()
        # 32 channels * 32 * 32: padding=1 keeps the 64x64 spatial size in the
        # convolution, and the stride-2 pool halves it to 32x32.
        self.fc1 = nn.Linear(32 * 32 * 32, 128)
        self.fc2 = nn.Linear(128, num_classes)

    def forward(self, x):
        """Return the class logits produced for the input batch ``x``."""
        x = self.pool(self.relu(self.conv1(x)))
        x = self.flatten(x)
        x = self.relu(self.fc1(x))
        return self.fc2(x)


# Initialize the model, loss function, and optimizer
# Model, loss function, and optimizer.
model = SimpleCNN()
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(params=model.parameters(), lr=0.001)

# Train the model
num_epochs = 5
for epoch in range(num_epochs):
    for images, labels in data_loader:
        # Clear gradients accumulated by the previous step.
        optimizer.zero_grad()

        outputs = model(images)
        loss = criterion(outputs, labels)

        loss.backward()
        optimizer.step()

    # Only the loss of the last mini-batch of the epoch is reported.
    print(f'Epoch [{epoch+1}/{num_epochs}], Loss: {loss.item():.4f}')

# Save the model (weights only, via its state dict)
torch.save(model.state_dict(), 'custom_classifier_model.pth')

# Test the model
# Evaluation pass.
# NOTE: `data_loader` wraps the training dataset, so the figure printed below
# is accuracy on the training images, not on held-out test data. For a real
# test score, iterate a loader built from a separate dataset instead.
model.eval()
correct = 0
total = 0
with torch.no_grad():  # no gradients are needed for inference
    for images, labels in data_loader:
        outputs = model(images)
        # Predicted class is the index of the largest logit in each row.
        predicted = outputs.argmax(dim=1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

print(f'Accuracy on the training images: {100 * correct / total:.2f}%')
這裡使用了 ImageFolder 數據集類,它會自動根據文件夾結構為每個類別分配標籤。請將 'path/to/dataset' 替換為你實際的數據集路徑。
這樣,你就無需手動指定文件路徑和標籤,代碼會自動從文件夾結構中獲取這些信息。注意:示例中的評估使用的是與訓練相同的數據,若要得到真正的測試準確率,請另外準備一份獨立的測試數據集。