cuda(non_blocking=true)

def contrastive_evaluate(val_loader, model, memory_bank):
    """Measure top-1 accuracy of kNN predictions made from a memory bank.

    Args:
        val_loader: Iterable of batches. Each batch is indexed with the keys
            'image' and 'target'; both values are moved to the GPU.
        model: Callable applied to the image batch. It must return exactly
            two values; only the first one (the contrastive features) is
            used here.
        memory_bank: Object exposing ``weighted_knn(features)``, whose result
            is compared element-wise with the targets.

    Returns:
        ``top1.avg`` of the meter, which is updated once per batch with the
        batch accuracy (in percent) and the batch size.
    """
    top1 = AverageMeter('Acc@1', ':6.2f')
    model.eval()

    # Nothing in this loop calls backward(), so autograd is disabled to avoid
    # building and retaining a computation graph for every validation batch.
    with torch.no_grad():
        for batch in val_loader:
            images = batch['image'].cuda(non_blocking=True)
            target = batch['target'].cuda(non_blocking=True)

            # The second output of the model is not needed for the kNN check.
            contrastive_features, _ = model(images)
            output = memory_bank.weighted_knn(contrastive_features)

            # Fraction of matching predictions, expressed as a percentage.
            acc1 = 100 * torch.mean(torch.eq(output, target).float())
            top1.update(acc1.item(), images.size(0))

    return top1.avg

这是一个用于评估对比学习模型的函数contrastive_evaluate。它接受一个验证数据加载器val_loader、一个对比学习模型model，以及一个存储样本特征的内存库memory_bank。首先，创建一个用于计算准确率的AverageMeter对象...

pytorch部分代码如下：class LDAMLoss(nn.Module): def init(self, cls_num_list, max_m=0.5, weight=None, s=30): super(LDAMLoss, self).init() m_list = 1.0 / np.sqrt(np.sqrt(cls_num_list)) m_list = m_list * (max_m / np.max(m_list)) m_list = torch.cuda.FloatTensor(m_list) self.m_list = m_list assert s > 0 self.s = s if weight is not None: weight = torch.FloatTensor(weight).cuda() self.weight = weight self.cls_num_list = cls_num_list def forward(self, x, target): index = torch.zeros_like(x, dtype=torch.uint8) index_float = index.type(torch.cuda.FloatTensor) batch_m = torch.matmul(self.m_list[None, :], index_float.transpose(0,1)) batch_m = batch_m.view((-1, 1)) # size=(batch_size, 1) (-1,1) x_m = x - batch_m output = torch.where(index, x_m, x) if self.weight is not None: output = output * self.weight[None, :] logit = output * self.s return F.cross_entropy(logit, target, weight=self.weight) train_loader = torch.utils.data.DataLoader(dataset_train, batch_size=BATCH_SIZE, shuffle=True,drop_last=True) test_loader = torch.utils.data.DataLoader(dataset_test, batch_size=BATCH_SIZE, shuffle=True) cls_num_list = np.zeros(classes) for , label in train_loader.dataset: cls_num_list[label] += 1 criterion_train = LDAMLoss(cls_num_list=cls_num_list, max_m=0.5, s=30) criterion_val = LDAMLoss(cls_num_list=cls_num_list, max_m=0.5, s=30) mixup_fn = Mixup( mixup_alpha=0.8, cutmix_alpha=1.0, cutmix_minmax=None, prob=0.1, switch_prob=0.5, mode='batch', label_smoothing=0.1, num_classes=classes) for batch_idx, (data, target) in enumerate(train_loader): data, target = data.to(device, non_blocking=True), Variable(target).to(device,non_blocking=True) # 3、将数据输入mixup_fn生成mixup数据 samples, targets = mixup_fn(data, target) targets = torch.tensor(targets).to(torch.long) # 4、将上一步生成的数据输入model，输出预测结果，再计算loss output = model(samples) # 5、梯度清零（将loss关于weight的导数变成0） optimizer.zero_grad() # 6、若使用混合精度 if use_amp: with torch.cuda.amp.autocast(): # 开启混合精度 loss = torch.nan_to_num(criterion_train(output, targets)) # 计算loss 
scaler.scale(loss).backward() # 梯度放大 torch.nn.utils.clip_grad_norm(model.parameters(), CLIP_GRAD) # 梯度裁剪，防止梯度爆炸 scaler.step(optimizer) # 更新下一次迭代的scaler scaler.update() # 否则，直接反向传播求梯度 else: loss = criterion_train(output, targets) loss.backward() torch.nn.utils.clip_grad_norm_(model.parameters(), CLIP_GRAD) optimizer.step() 报错：RuntimeError: Expected index [112, 1] to be smaller than self [16, 7] apart from dimension 1

这个报错是因为在计算batch_m时，index_float的维度是反过来的，应该将index_float.transpose(0,1)改为index_float.transpose(1,0)，即将第0维和第1维交换。修改后的代码如下： ... batch_m = torch.matmul...

def selflabel_train(train_loader, model, criterion, optimizer, epoch,
                    ema=None, output_file=None):
    """Run one epoch of self-labeling training on confident samples.

    For every batch the model is evaluated on the plain images and on their
    augmented counterparts; ``criterion`` receives both outputs and the
    resulting loss drives a single optimizer step.

    Args:
        train_loader: Iterable of batches indexed with the keys 'image' and
            'image_augmented'; ``len(train_loader)`` is used for the progress
            meter.
        model: Network being trained. Element ``[0]`` of its return value is
            used as the output.
        criterion: Callable taking ``(output, output_augmented)`` and
            returning the loss.
        optimizer: Optimizer stepped once per batch.
        epoch: Value inserted into the progress prefix.
        ema: Optional object with ``update_params(model)`` and
            ``apply_shadow(model)``; both are called after each step when it
            is not None.
        output_file: Passed through to ``ProgressMeter``.
    """
    loss_meter = AverageMeter('Loss', ':.4e')
    epoch_prefix = "Epoch: [{}]".format(epoch)
    progress = ProgressMeter(
        len(train_loader),
        [loss_meter],
        prefix=epoch_prefix,
        output_file=output_file,
    )
    model.train()

    for step, batch in enumerate(train_loader):
        plain = batch['image'].cuda(non_blocking=True)
        augmented = batch['image_augmented'].cuda(non_blocking=True)

        # Only the pass on the plain images is excluded from autograd; the
        # augmented pass has to keep its graph so loss.backward() can run.
        with torch.no_grad():
            plain_out = model(plain)[0]
        augmented_out = model(augmented)[0]

        loss = criterion(plain_out, augmented_out)
        loss_meter.update(loss.item())

        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        # Apply EMA to update the weights of the network.
        if ema is not None:
            ema.update_params(model)
            ema.apply_shadow(model)

        # Report progress on every 25th iteration, starting with the first.
        if step % 25 == 0:
            progress.display(step)

这段代码是一个自标记（self-labeling）训练的实现。函数接受训练数据加载器（train_loader）、模型（model）、损失函数（criterion）、优化器（optimizer）、当前的训练轮数（epoch）、指数移动平均（exponential ...

pytorch代码如下：class LDAMLoss(nn.Module): def init(self, cls_num_list, max_m=0.5, weight=None, s=30): super(LDAMLoss, self).init() m_list = 1.0 / np.sqrt(np.sqrt(cls_num_list)) m_list = m_list * (max_m / np.max(m_list)) m_list = torch.cuda.FloatTensor(m_list) self.m_list = m_list assert s > 0 self.s = s if weight is not None: weight = torch.FloatTensor(weight).cuda() self.weight = weight self.cls_num_list = cls_num_list def forward(self, x, target): index = torch.zeros_like(x, dtype=torch.uint8) index_float = index.type(torch.cuda.FloatTensor) batch_m = torch.matmul(self.m_list[None, :], index_float.transpose(1,0)) # 0,1 batch_m = batch_m.view((-1, 1)) # size=(batch_size, 1) (-1,1) x_m = x - batch_m output = torch.where(index, x_m, x) if self.weight is not None: output = output * self.weight[None, :] logit = output * self.s return F.cross_entropy(logit, target, weight=self.weight) classes=7, cls_num_list = np.zeros(classes) for , label in train_loader.dataset: cls_num_list[label] += 1 criterion_train = LDAMLoss(cls_num_list=cls_num_list, max_m=0.5, s=30) criterion_val = LDAMLoss(cls_num_list=cls_num_list, max_m=0.5, s=30) for batch_idx, (data, target) in enumerate(train_loader): data, target = data.to(device, non_blocking=True), Variable(target).to(device,non_blocking=True) # 3、将数据输入mixup_fn生成mixup数据 samples, targets = mixup_fn(data, target) targets = torch.tensor(targets).to(torch.long) # 4、将上一步生成的数据输入model，输出预测结果，再计算loss output = model(samples) # 5、梯度清零（将loss关于weight的导数变成0） optimizer.zero_grad() # 6、若使用混合精度 if use_amp: with torch.cuda.amp.autocast(): # 开启混合精度 loss = torch.nan_to_num(criterion_train(output, targets)) # 计算loss scaler.scale(loss).backward() # 梯度放大 torch.nn.utils.clip_grad_norm(model.parameters(), CLIP_GRAD) # 梯度裁剪，防止梯度爆炸 scaler.step(optimizer) # 更新下一次迭代的scaler scaler.update() 报错：File "/home/adminis/hpy/ConvNextV2_Demo/models/losses.py", line 53, in forward return F.cross_entropy(logit, target, weight=self.weight) File 
"/home/adminis/anaconda3/envs/wln/lib/python3.9/site-packages/torch/nn/functional.py", line 2824, in cross_entropy return torch._C._nn.cross_entropy_loss(input, target, weight, _Reduction.get_enum(reduction), ignore_index) RuntimeError: multi-target not supported at /pytorch/aten/src/THCUNN/generic/ClassNLLCriterion.cu:15

index_float = index.type(torch.cuda.FloatTensor) batch_m = torch.matmul(self.m_list[None, :], index_float.transpose(1,0)) # 0,1 batch_m = batch_m.view((-1, 1)) # size=(batch_size, 1) x_m = x - ...

pytorch部分代码如下：class LDAMLoss(nn.Module): def init(self, cls_num_list, max_m=0.5, weight=None, s=30): super(LDAMLoss, self).init() m_list = 1.0 / np.sqrt(np.sqrt(cls_num_list)) m_list = m_list * (max_m / np.max(m_list)) m_list = torch.cuda.FloatTensor(m_list) self.m_list = m_list assert s > 0 self.s = s # self.weight = weight if weight is not None: weight = torch.FloatTensor(weight).cuda() self.weight = weight self.cls_num_list = cls_num_list def forward(self, x, target): index = torch.zeros_like(x, dtype=torch.uint8) index_float = index.type(torch.cuda.FloatTensor) batch_m = torch.matmul(self.m_list[None, :], index_float.transpose(0,1)) # 0,1 batch_m = batch_m.view((x.size(0), 1)) # size=(batch_size, 1) (-1,1) x_m = x - batch_m output = torch.where(index, x_m, x) # return F.cross_entropy(self.soutput, target, weight=self.weight) if self.weight is not None: output = output self.weight[None, :] target = torch.flatten(target) # 将 target 转换成 1D Tensor logit = output * self.s return F.cross_entropy(logit, target, weight=self.weight) for batch_idx, (data, target) in enumerate(train_loader): data, target = data.to(device, non_blocking=True), Variable(target).to(device,non_blocking=True) # 3、将数据输入mixup_fn生成mixup数据 samples, targets = mixup_fn(data, target) # 4、将上一步生成的数据输入model，输出预测结果，再计算loss output = model(samples) # 5、梯度清零（将loss关于weight的导数变成0） optimizer.zero_grad() loss = criterion_train(output, targets) # 6、若使用混合精度 if use_amp: with torch.cuda.amp.autocast(): # 开启混合精度 # loss = torch.nan_to_num(criterion_train(output, target_a, target_b, lam)) # 计算loss # loss = lam * criterion_train(output, target_a) + (1 - lam) * criterion_train(output, target_b) # 计算 mixup 后的损失函数 scaler.scale(loss).backward() # 梯度放大 torch.nn.utils.clip_grad_norm_(model.parameters(), CLIP_GRAD) # 梯度裁剪，防止梯度爆炸 scaler.step(optimizer) # 更新下一次迭代的scaler scaler.update() # 否则，直接反向传播求梯度 else: # loss = criterion_train(output, targets) loss.backward() torch.nn.utils.clip_grad_norm_(model.parameters(), CLIP_GRAD) 
optimizer.step() 报错：) File "/home/adminis/hpy/ConvNextV2_Demo/models/losses.py", line 48, in forward output = torch.where(index, x_m, x) RuntimeError: expected scalar type float but found c10::Half

可以尝试将 index 和 index_float 的数据类型都指定为 torch.cuda.FloatTensor。修改代码如下： python index = torch.zeros_like(x, dtype=torch.uint8).cuda() index_float = index.type(torch.cuda....

pytorch部分代码如下：train_loss, train_acc = train(model_ft, DEVICE, train_loader, optimizer, epoch,model_ema) for batch_idx, (data, target) in enumerate(train_loader): data, target = data.to(device, non_blocking=True), Variable(target).to(device,non_blocking=True) samples, targets = mixup_fn(data, target) output = model(samples) optimizer.zero_grad() if use_amp: with torch.cuda.amp.autocast(): loss = torch.nan_to_num(criterion_train(output, targets)) scaler.scale(loss).backward() torch.nn.utils.clip_grad_norm_(model.parameters(), CLIP_GRAD) if not (self._backward_hooks or self._forward_hooks or self._forward_pre_hooks or _global_backward_hooks or global_forward_hooks or global_forward_pre_hooks): return forward_call(*input, **kwargs) class LDAMLoss(nn.Module): def init(self, cls_num_list, max_m=0.5, weight=None, s=30): super(LDAMLoss, self).init() m_list = 1.0 / np.sqrt(np.sqrt(cls_num_list)) m_list = m_list * (max_m / np.max(m_list)) m_list = torch.cuda.FloatTensor(m_list) self.m_list = m_list assert s > 0 self.s = s self.weight = weight def forward(self, x, target): index = torch.zeros_like(x, dtype=torch.uint8) target = torch.clamp(target, 0, index.size(1) - 1) index.scatter_(1, target.unsqueeze(1).type(torch.int64), 1) index = index[:, :x.size(1)] index_float = index.type(torch.cuda.FloatTensor) batch_m = torch.matmul(self.m_list[None, :], index_float.transpose(0,1)) batch_m = batch_m.view((-1, 1)) x_m = x - batch_m output = torch.where(index, x_m, x) return F.cross_entropy(self.soutput, target, weight=self.weight) 报错： File "/home/adminis/hpy/ConvNextV2_Demo/train+ca.py", line 46, in train loss = torch.nan_to_num(criterion_train(output, targets)) # 计算loss File "/home/adminis/anaconda3/envs/wln/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1051, in _call_impl return forward_call(input, **kwargs) File "/home/adminis/hpy/ConvNextV2_Demo/models/utils.py", line 622, in forward index.scatter_(1, target.unsqueeze(1).type(torch.int64), 1) # 
target.data.view(-1, 1). RuntimeError: Index tensor must have the same number of dimensions as self tensor 帮我看看如何修改源代码

从错误信息来看，index张量的维度和target张量不匹配。你可以尝试检查一下target张量的形状，看是否存在问题。同时，你可以在 index.scatter_ 操作之前，将 index 张量的最后一维进行裁剪，使其与 output...

return t.to(device, dtype if t.is_floating_point() or t.is_complex() else None, non_blocking) File "C:\Users\86150\AppData\Local\Programs\Python\Python38\lib\site-packages\torch\cuda\init.py", line 239, in _lazy_init raise AssertionError("Torch not compiled with CUDA enabled") AssertionError: Torch not compiled with CUDA enabled

如果返回True，则表示CUDA支持已经启用。如果返回False，则表示CUDA支持未启用。 3. 如果你之前已经安装了PyTorch但没有启用CUDA支持，你可以尝试重新安装PyTorch并确保选择了CUDA支持。如果你仍然遇到问题，...

生成一个 pytorch ddp 训练和验证 resnet18 的例子，并且代码中 ddp 使用 mpirun 的方式启动

images = images.cuda(rank, non_blocking=True) labels = labels.cuda(rank, non_blocking=True) outputs = model(images) loss = criterion(outputs, labels) # 梯度下降 optimizer.zero_grad() loss....

如何使用自动分配显存功能

2. 将数据复制到 GPU 显存中，在复制时使用 non_blocking=True，以便将计算和数据传输异步化。 device = torch.device('cuda') x = x.to(device, non_blocking=True) 3. 在模型训练过程中，使用 ...

多核mmd的pytorch实现

在训练循环中，我们使用 cuda(non_blocking=True) 来将数据转移到 GPU 上，并在每个批次上进行前向传递、计算损失、反向传递和优化。最后，我们使用 dist.destroy_process_group 清理分布式训练环境。需要注意...

torch.tensor.to

x = x.to('cuda', non_blocking=True) # 创建一个 GPU 上的 IntTensor 对象 y = torch.tensor([1, 2, 3], device='cuda', dtype=torch.int) 注意：在使用 to() 方法时，原来的 Tensor 对象并不会被修改，而是...

单机多卡训练卷积神经网络

data, target = data.cuda(gpu, non_blocking=True), target.cuda(gpu, non_blocking=True) optimizer.zero_grad() output = ddp_model(data) loss = criterion(output, target) loss.backward() optimizer....

pytorch中to()用法

to()方法是PyTorch中非常重要的方法，主要...x = x.to('cuda', non_blocking=True) 总之，to()方法是PyTorch中非常常用的方法，可以方便地将Tensor和模型移动到指定的设备上，也可以方便地进行数据类型的转换。

torch.backends.cudnn报错

os.environ\["CUDA_LAUNCH_BLOCKING"\] = "1" os.environ\["CUBLAS_WORKSPACE_CONFIG"\] = ":16:8" np.random.seed(seed) torch.manual_seed(seed) torch.cuda.manual_seed(seed) torch.cuda.manual_seed_all...

cuda(non_blocking=true)

return outputs * self._scale.to(device=outputs.device, non_blocking=True) RuntimeError: CUDA error: device-side assert triggered

相关推荐

cuda(non_blocking=true)

return outputs * self._scale.to(device=outputs.device, non_blocking=True) RuntimeError: CUDA error: device-side assert triggered

相关推荐

blocking.rar_blocking _blocking probability

bp.rar_blocking probability_cell

Blocking_Socket_File.zip_blocking socket

生成一个 pytorch ddp 训练和验证 resnet18 的例子，并且代码中 ddp 使用 mpirun 的方式启动

如何使用自动分配显存功能

多核mmd的pytorch实现

torch.tensor.to

单机多卡训练卷积神经网络

pytorch中to()用法

torch.backends.cudnn报错

最新推荐

pre_o_1csdn63m9a1bs0e1rr51niuu33e.a

matlab建立计算力学课程的笔记和文件.zip

FT-Prog-v3.12.38.643-FTD USB 工作模式设定及eprom读写

matlab基于RRT和人工势场法混合算法的路径规划.zip

matlab基于matlab的两步定位软件定义接收机的开源GNSS直接位置估计插件模块.zip

zigbee-cluster-library-specification

管理建模和仿真的文件

实现实时数据湖架构：Kafka与Hive集成

2． 通过python绘制 $y=e^{-x}\sin(2\pi x)$ 图像

JSBSim Reference Manual

2．通过python绘制 $y=e^{-x}\sin(2\pi x)$ 图像