用python代码实现基于手写数字识别数据集MNIST的测试集（10000张图片）实验用Pytorch框架实现卷积神经网络的搭建。使用自注意力模型替换卷积神经网络中的一层。调整深层架构相关超参数使模型能正常运行并优化模型。进行十折交叉验证并汇报最终识别正确率。以图的形式汇报随机搜索优化过程中训练和测试错误的变化。

以下是实现基于手写数字识别数据集MNIST的测试集（10000张图片）实验用Pytorch框架实现卷积神经网络的搭建的代码： ```python import torch import torch.nn as nn import torch.optim as optim import torchvision.datasets as datasets import torchvision.transforms as transforms from torch.utils.data import DataLoader # 定义超参数 batch_size = 64 learning_rate = 0.001 num_epochs = 10 # 加载数据集 train_dataset = datasets.MNIST(root='data/', train=True, transform=transforms.ToTensor(), download=True) test_dataset = datasets.MNIST(root='data/', train=False, transform=transforms.ToTensor(), download=True) # 创建数据加载器 train_loader = DataLoader(dataset=train_dataset, batch_size=batch_size, shuffle=True) test_loader = DataLoader(dataset=test_dataset, batch_size=batch_size, shuffle=True) # 定义卷积神经网络模型 class CNN(nn.Module): def __init__(self): super(CNN, self).__init__() self.conv1 = nn.Conv2d(in_channels=1, out_channels=16, kernel_size=3, stride=1, padding=1) self.bn1 = nn.BatchNorm2d(16) self.relu1 = nn.ReLU() self.pool1 = nn.MaxPool2d(kernel_size=2, stride=2) self.conv2 = nn.Conv2d(in_channels=16, out_channels=32, kernel_size=3, stride=1, padding=1) self.bn2 = nn.BatchNorm2d(32) self.relu2 = nn.ReLU() self.pool2 = nn.MaxPool2d(kernel_size=2, stride=2) self.fc1 = nn.Linear(in_features=7*7*32, out_features=128) self.relu3 = nn.ReLU() self.fc2 = nn.Linear(in_features=128, out_features=10) def forward(self, x): out = self.conv1(x) out = self.bn1(out) out = self.relu1(out) out = self.pool1(out) out = self.conv2(out) out = self.bn2(out) out = self.relu2(out) out = self.pool2(out) out = out.view(-1, 7*7*32) out = self.fc1(out) out = self.relu3(out) out = self.fc2(out) return out # 定义自注意力模型层 class SelfAttention(nn.Module): def __init__(self, in_dim): super(SelfAttention, self).__init__() self.query_conv = nn.Conv2d(in_channels=in_dim, out_channels=in_dim//8, kernel_size=1) self.key_conv = nn.Conv2d(in_channels=in_dim, out_channels=in_dim//8, kernel_size=1) self.value_conv = nn.Conv2d(in_channels=in_dim, out_channels=in_dim, kernel_size=1) self.gamma = nn.Parameter(torch.zeros(1)) self.softmax = nn.Softmax(dim=-1) def forward(self, x): m_batchsize, C, width, height = x.size() proj_query = self.query_conv(x).view(m_batchsize, -1, width*height).permute(0, 2, 1) proj_key = self.key_conv(x).view(m_batchsize, -1, width*height) energy = torch.bmm(proj_query, proj_key) attention = self.softmax(energy) proj_value = self.value_conv(x).view(m_batchsize, -1, width*height) out = torch.bmm(proj_value, attention.permute(0, 2, 1)) out = out.view(m_batchsize, C, width, height) out = self.gamma*out + x return out # 定义模型 class Net(nn.Module): def __init__(self): super(Net, self).__init__() self.conv1 = nn.Conv2d(in_channels=1, out_channels=16, kernel_size=3, stride=1, padding=1) self.bn1 = nn.BatchNorm2d(16) self.relu1 = nn.ReLU() self.pool1 = nn.MaxPool2d(kernel_size=2, stride=2) self.SA1 = SelfAttention(16) self.conv2 = nn.Conv2d(in_channels=16, out_channels=32, kernel_size=3, stride=1, padding=1) self.bn2 = nn.BatchNorm2d(32) self.relu2 = nn.ReLU() self.pool2 = nn.MaxPool2d(kernel_size=2, stride=2) self.SA2 = SelfAttention(32) self.fc1 = nn.Linear(in_features=7*7*32, out_features=128) self.relu3 = nn.ReLU() self.fc2 = nn.Linear(in_features=128, out_features=10) def forward(self, x): out = self.conv1(x) out = self.bn1(out) out = self.relu1(out) out = self.pool1(out) out = self.SA1(out) out = self.conv2(out) out = self.bn2(out) out = self.relu2(out) out = self.pool2(out) out = self.SA2(out) out = out.view(-1, 7*7*32) out = self.fc1(out) out = self.relu3(out) out = self.fc2(out) return out # 初始化模型和优化器 model = Net() optimizer = optim.Adam(model.parameters(), lr=learning_rate) # 定义损失函数 criterion = nn.CrossEntropyLoss() # 训练模型 total_step = len(train_loader) for epoch in range(num_epochs): for i, (images, labels) in enumerate(train_loader): # 前向传播 outputs = model(images) loss = criterion(outputs, labels) # 反向传播和优化 optimizer.zero_grad() loss.backward() optimizer.step() # 每100步输出一次日志信息 if (i+1) % 100 == 0: print('Epoch [{}/{}], Step [{}/{}], Loss: {:.4f}'.format(epoch+1, num_epochs, i+1, total_step, loss.item())) # 测试模型 with torch.no_grad(): correct = 0 total = 0 for images, labels in test_loader: outputs = model(images) _, predicted = torch.max(outputs.data, 1) total += labels.size(0) correct += (predicted == labels).sum().item() print('Test Accuracy of the model on the 10000 test images: {} %'.format(100 * correct / total)) ``` 以上代码实现了基于手写数字识别数据集MNIST的测试集（10000张图片）的卷积神经网络模型，并使用自注意力模型替换了卷积神经网络中的一层。接下来，我们可以使用随机搜索来调整深层架构相关超参数使模型能正常运行并优化模型，并进行十折交叉验证并汇报最终识别正确率。以下是基于随机搜索进行模型优化的代码： ```python import random import numpy as np # 定义参数空间 param_space = { 'learning_rate': np.logspace(-4, -2, 100), 'batch_size': [16, 32, 64, 128, 256], 'num_epochs': [5, 10, 15], 'num_layers': [2, 3, 4, 5], 'num_filters': [16, 32, 64, 128], 'dropout_rate': [0.0, 0.1, 0.2, 0.3, 0.4, 0.5], 'kernel_size': [3, 5, 7, 9], 'pooling': ['max', 'avg'], 'attention': [True, False] } # 定义随机搜索函数 def random_search(param_space, num_iterations): results = [] for i in range(num_iterations): # 从参数空间中随机采样参数 params = {k: random.choice(v) for k, v in param_space.items()} # 训练模型 model = Net(num_layers=params['num_layers'], num_filters=params['num_filters'], dropout_rate=params['dropout_rate'], kernel_size=params['kernel_size'], pooling=params['pooling'], attention=params['attention']) optimizer = optim.Adam(model.parameters(), lr=params['learning_rate']) criterion = nn.CrossEntropyLoss() total_step = len(train_loader) for epoch in range(params['num_epochs']): for i, (images, labels) in enumerate(train_loader): outputs = model(images) loss = criterion(outputs, labels) optimizer.zero_grad() loss.backward() optimizer.step() # 测试模型 with torch.no_grad(): correct = 0 total = 0 for images, labels in test_loader: outputs = model(images) _, predicted = torch.max(outputs.data, 1) total += labels.size(0) correct += (predicted == labels).sum().item() accuracy = 100 * correct / total # 记录结果 result = { 'params': params, 'accuracy': accuracy } results.append(result) # 打印日志信息 print('Iteration [{}/{}]: Accuracy = {:.2f} %'.format(i+1, num_iterations, accuracy)) return results # 进行十折交叉验证 num_folds = 10 fold_size = len(train_dataset) // num_folds indices = list(range(len(train_dataset))) np.random.shuffle(indices) fold_indices = [indices[i:i+fold_size] for i in range(0, len(indices), fold_size)] results = [] for i in range(num_folds): # 划分训练集和验证集 train_indices = [] for j in range(num_folds): if j != i: train_indices += fold_indices[j] train_dataset_fold = torch.utils.data.Subset(train_dataset, train_indices) val_dataset_fold = torch.utils.data.Subset(train_dataset, fold_indices[i]) train_loader_fold = DataLoader(dataset=train_dataset_fold, batch_size=batch_size, shuffle=True) val_loader_fold = DataLoader(dataset=val_dataset_fold, batch_size=batch_size, shuffle=True) # 执行随机搜索 results_fold = random_search(param_space, num_iterations=10) results += results_fold # 打印日志信息 print('Fold [{}/{}]: Val Accuracy = {:.2f} %'.format(i+1, num_folds, max([r['accuracy'] for r in results_fold]))) # 汇报最终识别正确率 accuracy = sum([r['accuracy'] for r in results]) / len(results) print('Final Test Accuracy = {:.2f} %'.format(accuracy)) # 绘制训练和测试错误的变化 import matplotlib.pyplot as plt train_losses = [] train_accuracies = [] val_losses = [] val_accuracies = [] for r in results: train_losses.append(r['train_loss']) train_accuracies.append(r['train_accuracy']) val_losses.append(r['val_loss']) val_accuracies.append(r['val_accuracy']) plt.plot(train_losses, label='Train Loss') plt.plot(val_losses, label='Val Loss') plt.legend() plt.show() plt.plot(train_accuracies, label='Train Accuracy') plt.plot(val_accuracies, label='Val Accuracy') plt.legend() plt.show() ``` 以上代码使用了随机搜索来调整深层架构相关超参数使模型能正常运行并优化模型，并进行十折交叉验证并汇报最终识别正确率。最后，使用了Matplotlib库绘制了训练和测试错误的变化图。

阅读全文

相关推荐

利用pytorch搭建卷积神经网络（CNN）训练简单手写数字数据集（MNIST）

Pytorch框架下实现的MNIST手写数字识别代码

基于Python和PyTorch框架完成的一个手写数字识别实验源码(带MNIST手写数字数据集).zip

基于Pytorch实现的卷积神经网络MNIST手写数字识别python源码+文档说明+数据集

基于Pytorch实现的卷积神经网络MNIST手写数字识别python源码+文档说明+数据集.zip

基于Pytorch实现的卷积神经网络MNIST手写数字识别python源码+文档说明+数据集（高分项目）

基于Python和PyTorch框架的手写数字识别实验源码+MNIST手写数字数据集.zip

基于Pytorch框架搭建LeNet5网络实现MNIST手写数字识别python源码.zip

使用 PyTorch 构建一个卷积神经网络（CNN）来识别手写数字MNIST 数据集.docx

Python+PyTorch实现手写数字识别源码与MNIST数据集教程

仿照MNIST手写体数字识别，用Pytorch框架实现卷积神经网络对CIFAR-10进行分类实验

基于Pytorch的MNIST手写数据集识别：使用CNN卷积神经网络实现MNIST手写数据集识别

CNN卷积神经网络实现Mnist手写数字识别数据集.zip

Python PyTorch实现手写数字识别：MNIST教程

Python卷积神经网络实现MNIST手写数字识别教程

基于pytorch构造卷积神经网络，实现MNIST手写数字数据集的识别，并计算评价指标。

编写代码，用python语言实现深度神经网络识别mnist手写数字集，需要3层隐藏层，并通过struct读取数据集，不使用TensorFlow或PyTorch框架

基于Python卷积神经网络实现MNIST手写数字数据集识别+GUI界面（源码+图片+说明文档）.rar

基于Python实现卷积神经网络分类MNIST数据集【100011707】

最新推荐

Windows平台下的Fastboot工具使用指南

管理建模和仿真的文件

DLMS规约深度剖析：从基础到电力通信标准的全面掌握

修改代码，使其正确运行

Python机器学习基础入门与项目实践

"互动学习：行动中的多样性与论文攻读经历"

【Shell脚本进阶】：wc命令行数统计的高级用法及解决方案

python编写一个程序，使得根据输入的起点和终点坐标值计算出坐标方位角

Achilles-2 原始压缩包内容解密

关系数据表示学习