pytorch 训练数据以及测试 全部代码(1)
发布日期:2021-06-29 11:44:34
浏览次数:3
分类:技术文章
本文共 9090 字,大约阅读时间需要 30 分钟。
这个是deeplabV3+的训练代码,用于训练的数据是VOC2012 和SBD数据
import socketimport timeitfrom datetime import datetimeimport osimport globfrom collections import OrderedDict# PyTorch includesimport torchfrom torch.autograd import Variableimport torch.optim as optimfrom torchvision import transformsfrom torch.utils.data import DataLoaderfrom torchvision.utils import make_grid# Tensorboard includefrom tensorboardX import SummaryWriter# Custom includesfrom dataloaders import pascal, sbd, combine_dbsfrom dataloaders import utilsfrom networks import deeplab_xception, deeplab_resnetfrom dataloaders import custom_transforms as trgpu_id = 0print('Using GPU: {} '.format(gpu_id))# Setting parametersuse_sbd = True # Whether to use SBD datasetnEpochs = 100 # Number of epochs for trainingresume_epoch = 0 # Default is 0, change if want to resumep = OrderedDict() # Parameters to include in reportp['trainBatch'] = 6 # Training batch sizetestBatch = 6 # Testing batch sizeuseTest = True # See evolution of the test set when trainingnTestInterval = 5 # Run on test set every nTestInterval epochssnapshot = 10 # Store a model every snapshot epochsp['nAveGrad'] = 1 # Average the gradient of several iterationsp['lr'] = 1e-7 # Learning ratep['wd'] = 5e-4 # Weight decayp['momentum'] = 0.9 # Momentump['epoch_size'] = 10 # How many epochs to change learning ratebackbone = 'xception' # Use xception or resnet as feature extractor,save_dir_root = os.path.join(os.path.dirname(os.path.abspath(__file__)))exp_name = os.path.dirname(os.path.abspath(__file__)).split('/')[-1]if resume_epoch != 0: runs = sorted(glob.glob(os.path.join(save_dir_root, 'run', 'run_*'))) run_id = int(runs[-1].split('_')[-1]) if runs else 0else: runs = sorted(glob.glob(os.path.join(save_dir_root, 'run', 'run_*'))) run_id = int(runs[-1].split('_')[-1]) + 1 if runs else 0save_dir = os.path.join(save_dir_root, 'run', 'run_' + str(run_id))# Network definitionif backbone == 'xception': net = deeplab_xception.DeepLabv3_plus(nInputChannels=3, n_classes=21, os=16, pretrained=True)elif backbone == 'resnet': net = deeplab_resnet.DeepLabv3_plus(nInputChannels=3, n_classes=21, os=16, pretrained=True)else: raise NotImplementedErrormodelName = 'deeplabv3plus-' + backbone + '-voc'criterion = utils.cross_entropy2dif resume_epoch == 0: print("Training deeplabv3+ from scratch...")else: print("Initializing weights from: {}...".format( os.path.join(save_dir, 'models', modelName + '_epoch-' + str(resume_epoch - 1) + '.pth'))) net.load_state_dict( torch.load(os.path.join(save_dir, 'models', modelName + '_epoch-' + str(resume_epoch - 1) + '.pth'), map_location=lambda storage, loc: storage)) # Load all tensors onto the CPUif gpu_id >= 0: torch.cuda.set_device(device=gpu_id) net.cuda()if resume_epoch != nEpochs: # Logging into Tensorboard log_dir = os.path.join(save_dir, 'models', datetime.now().strftime('%b%d_%H-%M-%S') + '_' + socket.gethostname()) writer = SummaryWriter(log_dir=log_dir) # Use the following optimizer optimizer = optim.SGD(net.parameters(), lr=p['lr'], momentum=p['momentum'], weight_decay=p['wd']) p['optimizer'] = str(optimizer) composed_transforms_tr = transforms.Compose([ tr.RandomSized(512), tr.RandomRotate(15), tr.RandomHorizontalFlip(), tr.Normalize(mean=(0.485, 0.456, 0.406), std=(0.229, 0.224, 0.225)), tr.ToTensor()]) composed_transforms_ts = transforms.Compose([ tr.FixedResize(size=(512, 512)), tr.Normalize(mean=(0.485, 0.456, 0.406), std=(0.229, 0.224, 0.225)), tr.ToTensor()]) voc_train = pascal.VOCSegmentation(split='train', transform=composed_transforms_tr) voc_val = pascal.VOCSegmentation(split='val', transform=composed_transforms_ts) if use_sbd: print("Using SBD dataset") sbd_train = sbd.SBDSegmentation(split=['train', 'val'], transform=composed_transforms_tr) db_train = combine_dbs.CombineDBs([voc_train, sbd_train], excluded=[voc_val]) else: db_train = voc_train trainloader = DataLoader(db_train, batch_size=p['trainBatch'], shuffle=True, num_workers=0) testloader = DataLoader(voc_val, batch_size=testBatch, shuffle=False, num_workers=0) utils.generate_param_report(os.path.join(save_dir, exp_name + '.txt'), p) num_img_tr = len(trainloader) num_img_ts = len(testloader) running_loss_tr = 0.0 running_loss_ts = 0.0 aveGrad = 0 global_step = 0 print("Training Network") # Main Training and Testing Loop for epoch in range(resume_epoch, nEpochs): start_time = timeit.default_timer() if epoch % p['epoch_size'] == p['epoch_size'] - 1: lr_ = utils.lr_poly(p['lr'], epoch, nEpochs, 0.9) print('(poly lr policy) learning rate: ', lr_) optimizer = optim.SGD(net.parameters(), lr=lr_, momentum=p['momentum'], weight_decay=p['wd']) net.train() for ii, sample_batched in enumerate(trainloader): inputs, labels = sample_batched['image'], sample_batched['label'] # Forward-Backward of the mini-batch inputs, labels = Variable(inputs, requires_grad=True), Variable(labels) global_step += inputs.data.shape[0] if gpu_id >= 0: inputs, labels = inputs.cuda(), labels.cuda() outputs = net.forward(inputs) loss = criterion(outputs, labels, size_average=False, batch_average=True) running_loss_tr += loss.item() # Print stuff if ii % num_img_tr == (num_img_tr - 1): running_loss_tr = running_loss_tr / num_img_tr writer.add_scalar('data/total_loss_epoch', running_loss_tr, epoch) print('[Epoch: %d, numImages: %5d]' % (epoch, ii * p['trainBatch'] + inputs.data.shape[0])) print('Loss: %f' % running_loss_tr) running_loss_tr = 0 stop_time = timeit.default_timer() print("Execution time: " + str(stop_time - start_time) + "\n") # Backward the averaged gradient loss /= p['nAveGrad'] loss.backward() aveGrad += 1 # Update the weights once in p['nAveGrad'] forward passes if aveGrad % p['nAveGrad'] == 0: writer.add_scalar('data/total_loss_iter', loss.item(), ii + num_img_tr * epoch) optimizer.step() optimizer.zero_grad() aveGrad = 0 # Show 10 * 3 images results each epoch if ii % (num_img_tr // 10) == 0: grid_image = make_grid(inputs[:3].clone().cpu().data, 3, normalize=True) writer.add_image('Image', grid_image, global_step) grid_image = make_grid(utils.decode_seg_map_sequence(torch.max(outputs[:3], 1)[1].detach().cpu().numpy()), 3, normalize=False, range=(0, 255)) writer.add_image('Predicted label', grid_image, global_step) grid_image = make_grid(utils.decode_seg_map_sequence(torch.squeeze(labels[:3], 1).detach().cpu().numpy()), 3, normalize=False, range=(0, 255)) writer.add_image('Groundtruth label', grid_image, global_step) # Save the model if (epoch % snapshot) == snapshot - 1: torch.save(net.state_dict(), os.path.join(save_dir, 'models', modelName + '_epoch-' + str(epoch) + '.pth')) print("Save model at {}\n".format(os.path.join(save_dir, 'models', modelName + '_epoch-' + str(epoch) + '.pth'))) # One testing epoch if useTest and epoch % nTestInterval == (nTestInterval - 1): total_miou = 0.0 net.eval() for ii, sample_batched in enumerate(testloader): inputs, labels = sample_batched['image'], sample_batched['label'] # Forward pass of the mini-batch inputs, labels = Variable(inputs, requires_grad=True), Variable(labels) if gpu_id >= 0: inputs, labels = inputs.cuda(), labels.cuda() with torch.no_grad(): outputs = net.forward(inputs) predictions = torch.max(outputs, 1)[1] loss = criterion(outputs, labels, size_average=False, batch_average=True) running_loss_ts += loss.item() total_miou += utils.get_iou(predictions, labels) # Print stuff if ii % num_img_ts == num_img_ts - 1: miou = total_miou / (ii * testBatch + inputs.data.shape[0]) running_loss_ts = running_loss_ts / num_img_ts print('Validation:') print('[Epoch: %d, numImages: %5d]' % (epoch, ii * testBatch + inputs.data.shape[0])) writer.add_scalar('data/test_loss_epoch', running_loss_ts, epoch) writer.add_scalar('data/test_miour', miou, epoch) print('Loss: %f' % running_loss_ts) print('MIoU: %f\n' % miou) running_loss_ts = 0 writer.close()
后面文章就会详细讲解这个代码
转载地址:https://blog.csdn.net/zz2230633069/article/details/82867800 如侵犯您的版权,请留言回复原文章的地址,我们会给您删除此文章,给您带来不便请您谅解!
发表评论
最新留言
初次前来,多多关照!
[***.217.46.12]2024年04月19日 03时49分42秒
关于作者
喝酒易醉,品茶养心,人生如梦,品茶悟道,何以解忧?唯有杜康!
-- 愿君每日到此一游!
推荐文章
数组-769. 最多能完成排序的块
2019-04-29
超过256的像素值的保存
2019-04-29
middle-判断二分图-深度优先和广度优先
2019-04-29
二进制补码和原码的记录
2019-04-29
双指针-二分-167. 两数之和 II - 输入有序数组
2019-04-29
双指针-45. 反转字符串中的元音字母
2019-04-29
双指针--环形链表
2019-04-29
python 模块化__init__.py-------__all__
2019-04-29
无重叠区间+用最少数量的箭引爆气球
2019-04-29
买卖股票的最佳时机
2019-04-29
非递减数列
2019-04-29
AUC粗浅理解笔记记录
2019-04-29
分治法:241. 为运算表达式设计优先级
2019-04-29
广度优先遍历:二进制矩阵中的最短路径
2019-04-29
广度优先遍历:set集合的速度远远比list快:完全平方数
2019-04-29
广度+深度:岛屿的最大面积/岛屿数量
2019-04-29
torch 模型运行时间与forward没对应的可能原因
2019-04-29
130. 被围绕的区域
2019-04-29
欧式距离、余弦相似度和余弦距离
2019-04-29
transform 等效转换(参考源码)
2019-04-29