cifar-10-dataset

import cv2

import numpy as np

import os

import pickle

# Directory holding the pickled CIFAR-10 batch files that are read below.
data_dir = os.path.join("data", "cifar-10-batches-py")

# Root directory the training-set PNGs are written to.
train_o_dir = os.path.join("data", "train")

# Root directory the test-set PNGs are written to.
test_o_dir = os.path.join("data", "test")

Train = True   # when True the training batches are exported too; set to False to export only the test batch

def unpickle(file):
    """Deserialize one pickled batch file and return the stored object.

    The file is opened in binary mode and decoded with ``encoding='bytes'``,
    so strings pickled by Python 2 come back as ``bytes`` (which is why the
    callers index the result with keys such as ``b'data'``).

    NOTE(review): ``pickle.load`` can execute arbitrary code; only use this on
    batch files obtained from a trusted source.

    Args:
        file: Path of the pickled file to read.

    Returns:
        The unpickled object (a dictionary for the CIFAR-10 batch files).
    """
    with open(file, 'rb') as handle:
        return pickle.load(handle, encoding='bytes')

def my_mkdir(my_dir):
    """Create ``my_dir`` (including missing parents) if it does not exist yet.

    ``exist_ok=True`` makes the call idempotent without a separate
    ``os.path.isdir`` check, so there is no window in which another process
    can create the directory between the check and the creation.

    Args:
        my_dir: Path of the directory to create.

    Raises:
        FileExistsError: If ``my_dir`` exists but is not a directory.
    """
    os.makedirs(my_dir, exist_ok=True)

# Export the CIFAR-10 batches as PNG files, one sub-directory per label.

def _save_batch_images(batch, out_root, name_offset=0):
    """Write every image of one unpickled batch to ``out_root/<label>/``.

    Args:
        batch: Dictionary returned by ``unpickle``; ``batch[b'data']`` holds one
            flat 3072-value row per image and ``batch[b'labels']`` the matching
            integer labels.
        out_root: Directory under which the per-label folders are created.
        name_offset: Value added to the in-batch index when building the file
            name, so images from different batches get distinct numbers.
    """
    created = set()  # label directories already ensured during this call
    labels = batch[b'labels']
    for i, row in enumerate(batch[b'data']):
        # Row layout is channel-first (3, 32, 32); move channels last.
        img = np.reshape(row, (3, 32, 32)).transpose(1, 2, 0)
        # CIFAR-10 stores the planes as R, G, B while cv2.imwrite interprets
        # the last axis as B, G, R. Reverse it so the PNG keeps true colours.
        img = np.ascontiguousarray(img[:, :, ::-1])

        label_num = str(labels[i])
        o_dir = os.path.join(out_root, label_num)
        if o_dir not in created:
            my_mkdir(o_dir)
            created.add(o_dir)

        img_name = label_num + '_' + str(i + name_offset) + '.png'
        cv2.imwrite(os.path.join(o_dir, img_name), img)


if __name__ == '__main__':

    if Train:
        for j in range(1, 6):
            data_path = os.path.join(data_dir, "data_batch_" + str(j))  # data_batch_1 .. data_batch_5
            train_data = unpickle(data_path)
            print(data_path + " is loading...")
            # Offsetting by 10000 per batch keeps the historical file numbering.
            _save_batch_images(
                train_data,
                os.path.join(train_o_dir, "data_batch_" + str(j)),
                (j - 1) * 10000,
            )
            print(data_path + " loaded.")

    print("test_batch is loading...")

    # Export the test-set images.
    test_data_path = os.path.join(data_dir, "test_batch")
    test_data = unpickle(test_data_path)
    _save_batch_images(test_data, test_o_dir)

    print("test_batch loaded.")

import sys

import os

def _write_image_list(txt_path, class_roots):
    """Write a ``<image path> <label>`` index file for the given directories.

    Each directory in ``class_roots`` is walked; for every sub-directory found,
    every file ending in ``png`` is listed. The label is the part of the file
    name before the first underscore.

    Args:
        txt_path: Path of the index file to (over)write.
        class_roots: Iterable of directories that contain per-label folders.
    """
    # The context manager guarantees the index file is flushed and closed,
    # including when several files are produced in a loop.
    with open(txt_path, 'w') as ft:
        for data_path in class_roots:
            print(data_path)
            for root, s_dirs, _ in os.walk(data_path, topdown=True):
                print(s_dirs)
                for sub_dir in s_dirs:
                    i_dir = os.path.join(root, sub_dir)   # one label folder
                    for img_name in os.listdir(i_dir):
                        if not img_name.endswith('png'):  # skip anything that is not a PNG
                            continue
                        label = img_name.split('_')[0]
                        img_path = os.path.join(i_dir, img_name)
                        ft.write(img_path + ' ' + label + '\n')


my_mkdir("data/traintxt")

train_batch_dirs = [
    os.path.join("data/train/", "data_batch_" + str(j))  # data_batch_1 .. data_batch_5
    for j in range(1, 6)
]

# One index file per training batch.
for j, batch_dir in enumerate(train_batch_dirs, start=1):
    _write_image_list(
        os.path.join("data/traintxt", "data_batch_" + str(j) + ".txt"),
        [batch_dir],
    )

# One index file covering the whole training set.
_write_image_list(os.path.join("data", "train.txt"), train_batch_dirs)

# Index file for the test set.
_write_image_list(os.path.join("data", "test.txt"), [os.path.join("data", "test")])

Training script (main.py), adapted from another author's GitHub repository

'''Train CIFAR10 with PyTorch.'''

import torch

import torch.nn as nn

import torch.optim as optim

import torch.nn.functional as F

import torch.backends.cudnn as cudnn

from torch.utils.data import Dataset

from PIL import Image

import torchvision

import torchvision.transforms as transforms

import os

import argparse

from models import *

from utils import progress_bar

class Mydataset(Dataset):
    """Image dataset described by a text index file.

    Every non-blank line of the index has the form ``<image path> <label>``,
    separated by whitespace; the label is parsed as an integer.

    Args:
        txt_path: Path of the index file.
        transform: Optional callable applied to the loaded PIL image.
        target_transform: Optional callable applied to the integer label.
    """

    def __init__(self, txt_path, transform=None, target_transform=None):
        imgs = []
        # Close the index file deterministically once it has been read.
        with open(txt_path, 'r') as fh:
            for line in fh:
                words = line.split()
                if not words:
                    # Tolerate blank lines (e.g. a trailing newline at EOF).
                    continue
                imgs.append((words[0], int(words[1])))

        # Assigned after the loop so the attributes exist for an empty index too.
        self.imgs = imgs
        self.transform = transform
        self.target_transform = target_transform

    def __getitem__(self, index):
        """Return the ``(image, label)`` pair stored at ``index``."""
        fn, label = self.imgs[index]
        # Force three channels so greyscale or palette files still produce the
        # 3-channel input the normalisation transforms are written for.
        img = Image.open(fn).convert('RGB')

        if self.transform is not None:
            img = self.transform(img)
        if self.target_transform is not None:
            label = self.target_transform(label)

        return img, label

    def __len__(self):
        """Return the number of indexed images."""
        return len(self.imgs)

# Command-line options.
parser = argparse.ArgumentParser(description='PyTorch CIFAR10 Training')
parser.add_argument('--lr', default=0.1, type=float, help='learning rate')
parser.add_argument('--resume', '-r', action='store_true',
                    help='resume from checkpoint')
args = parser.parse_args()

device = 'cuda' if torch.cuda.is_available() else 'cpu'
best_acc = 0  # best test accuracy
start_epoch = 0  # start from epoch 0 or last checkpoint epoch

# Data
print('==> Preparing data..')

# Training images get random crop/flip augmentation before normalisation.
transform_train = transforms.Compose([
    transforms.RandomCrop(32, padding=4),
    transforms.RandomHorizontalFlip(),
    transforms.ToTensor(),
    transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)),
])

# Evaluation must be deterministic: no random augmentation here, otherwise the
# reported accuracy (and therefore best_acc) changes from run to run.
transform_test = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)),
])

trainset = Mydataset(txt_path='/work/aiit/warming/cifar-10-batches-py/train.txt',
                     transform=transform_train)
trainloader = torch.utils.data.DataLoader(
    trainset, batch_size=128, shuffle=True, num_workers=2)

testset = Mydataset(txt_path='/work/aiit/warming/cifar-10-batches-py/test.txt',
                    transform=transform_test)
testloader = torch.utils.data.DataLoader(
    testset, batch_size=100, shuffle=False, num_workers=2)

classes = ('plane', 'car', 'bird', 'cat', 'deer',
           'dog', 'frog', 'horse', 'ship', 'truck')

# Model
print('==> Building model..')
# Alternatives that were tried here (swap in place of RegNetX_200MF):
# vgg.VGG('VGG19'), ResNet18(), PreActResNet18(), GoogLeNet(), DenseNet121(),
# ResNeXt29_2x64d(), MobileNet(), MobileNetV2(), DPN92(), ShuffleNetG2(),
# SENet18(), ShuffleNetV2(1), EfficientNetB0()
net = RegNetX_200MF()
net = net.to(device)
if device == 'cuda':
    net = torch.nn.DataParallel(net)
    cudnn.benchmark = True

if args.resume:
    # Load checkpoint.
    print('==> Resuming from checkpoint..')
    assert os.path.isdir('checkpoint'), 'Error: no checkpoint directory found!'
    # map_location lets a checkpoint written on a GPU be restored on a CPU host.
    checkpoint = torch.load('./checkpoint/ckpt.pth', map_location=device)
    net.load_state_dict(checkpoint['net'])
    best_acc = checkpoint['acc']
    start_epoch = checkpoint['epoch']

criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(net.parameters(), lr=args.lr,
                      momentum=0.9, weight_decay=5e-4)

# Training

def train(epoch):
    """Run one training epoch over ``trainloader`` and save the model.

    Uses the module-level ``net``, ``criterion``, ``optimizer``, ``device`` and
    ``trainloader``. Running loss and accuracy are reported through
    ``progress_bar`` after every batch. At the end of the epoch the whole
    model object is written to ``./checkpoint/RegNetX_200MF.pth``.

    Args:
        epoch: Epoch number, used only for the progress message.
    """
    print('\nEpoch: %d' % epoch)
    net.train()
    train_loss = 0
    correct = 0
    total = 0
    for batch_idx, (inputs, targets) in enumerate(trainloader):
        inputs, targets = inputs.to(device), targets.to(device)
        optimizer.zero_grad()
        outputs = net(inputs)
        loss = criterion(outputs, targets)
        loss.backward()
        optimizer.step()

        train_loss += loss.item()
        _, predicted = outputs.max(1)
        total += targets.size(0)
        correct += predicted.eq(targets).sum().item()

        progress_bar(batch_idx, len(trainloader), 'Loss: %.3f | Acc: %.3f%% (%d/%d)'
                     % (train_loss/(batch_idx+1), 100.*correct/total, correct, total))

    # train() runs before anything else creates the directory, so make sure it
    # exists; otherwise the very first save fails on a fresh checkout.
    os.makedirs('checkpoint', exist_ok=True)
    torch.save(net, './checkpoint/RegNetX_200MF.pth')

def test(epoch):
    """Evaluate ``net`` on ``testloader`` and checkpoint it when it improves.

    Uses the module-level ``net``, ``criterion``, ``device`` and ``testloader``.
    When the accuracy beats ``best_acc``, the state dict, accuracy and epoch
    are saved to ``./checkpoint/ckpt.pth`` (the file the ``--resume`` path
    loads) and ``best_acc`` is updated.

    Args:
        epoch: Epoch number stored in the checkpoint.
    """
    global best_acc
    net.eval()
    test_loss = 0
    correct = 0
    total = 0
    with torch.no_grad():
        for batch_idx, (inputs, targets) in enumerate(testloader):
            inputs, targets = inputs.to(device), targets.to(device)
            outputs = net(inputs)
            loss = criterion(outputs, targets)

            test_loss += loss.item()
            _, predicted = outputs.max(1)
            total += targets.size(0)
            correct += predicted.eq(targets).sum().item()

            progress_bar(batch_idx, len(testloader), 'Loss: %.3f | Acc: %.3f%% (%d/%d)'
                         % (test_loss/(batch_idx+1), 100.*correct/total, correct, total))

    # Save checkpoint.
    acc = 100.*correct/total
    if acc > best_acc:
        print('Saving..')
        state = {
            'net': net.state_dict(),
            'acc': acc,
            'epoch': epoch,
        }
        os.makedirs('checkpoint', exist_ok=True)
        # Persist the state so that --resume has a ckpt.pth to load; previously
        # the dictionary was built and then discarded.
        torch.save(state, './checkpoint/ckpt.pth')
        best_acc = acc

# Train for 100 epochs counted from the starting epoch, evaluating after each.
final_epoch = start_epoch + 100
for epoch in range(start_epoch, final_epoch):
    train(epoch)
    test(epoch)

预测

import torch

import cv2

import torch.nn.functional as F

import sys

sys.path.append('/work/aiit/warming/pytorch-cifar-master/models')

#import vgg

#import torchvision.models as models

#from vgg2 import vgg #重要，虽然显示灰色(即在次代码中没用到)，但若没有引入这个模型代码，加载模型时会找不到模型

from torch.autograd import Variable

from torchvision import datasets, transforms

import numpy as np

# Class names indexed by the integer label the network predicts.
classes = ('plane', 'car', 'bird', 'cat', 'deer', 'dog', 'frog', 'horse', 'ship', 'truck')

if __name__ == '__main__':
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

    # Load the full model object written by the training script. map_location
    # allows a model saved on a GPU to be loaded on a CPU-only machine.
    model = torch.load('/work/aiit/warming/pytorch-cifar-master/checkpoint/RegNetX_200MF.pth',
                       map_location=device)
    # The training script wraps the network in DataParallel on CUDA; unwrap it
    # so single-image inference also works where those GPUs are not present.
    if isinstance(model, torch.nn.DataParallel):
        model = model.module
    model = model.to(device)
    model.eval()  # switch to inference mode

    img_path = "/work/aiit/warming/cifar-10-batches-py/test/1/1_6.png"  # image to classify
    img = cv2.imread(img_path)
    if img is None:
        # cv2.imread signals an unreadable/missing file by returning None.
        raise FileNotFoundError('cannot read image: ' + img_path)
    # cv2 loads pixels as BGR, whereas training read the files with PIL (RGB).
    img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
    img = cv2.resize(img, (32, 32))

    # Same normalisation statistics as the training/evaluation transforms.
    trans = transforms.Compose([
        transforms.ToTensor(),
        transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)),
    ])

    # Add the batch dimension: [channels, H, W] -> [1, channels, H, W].
    img = trans(img).to(device).unsqueeze(0)

    with torch.no_grad():  # no gradients are needed for prediction
        output = model(img)
        prob = F.softmax(output, dim=1)  # probabilities of the 10 classes

    print(prob)

    predicted = output.argmax(dim=1)
    pred_class = classes[predicted.item()]
    print(pred_class)

cifar-10-dataset的更多相关文章

【翻译】TensorFlow卷积神经网络识别CIFAR 10Convolutional Neural Network (CNN)| CIFAR 10 TensorFlow
原网址:https://data-flair.training/blogs/cnn-tensorflow-cifar-10/ by DataFlair Team · Published May 21, ...
DL Practice：Cifar 10分类
Step 1:数据加载和处理一般使用深度学习框架会经过下面几个流程: 模型定义(包括损失函数的选择)——>数据处理和加载——>训练(可能包括训练过程可视化)——>测试所以自己写代 ...
【神经网络与深度学习】基于Windows+Caffe的Minst和CIFAR—10训练过程说明
Minst训练我的路径:G:\Caffe\Caffe For Windows\examples\mnist 对于新手来说,初步完成环境的配置后,一脸茫然.不知如何跑Demo,有么有!那么接下来的教 ...
PyTorch教程之Training a classifier
我们已经了解了如何定义神经网络,计算损失并对网络的权重进行更新. 接下来的问题就是: 一.What about data? 通常处理图像.文本.音频或视频数据时,可以使用标准的python包将数据加载 ...
TensorLayer官方中文文档1.7.4：API – 数据预处理
所属分类:TensorLayer API - 数据预处理¶ 我们提供大量的数据增强及处理方法,使用 Numpy, Scipy, Threading 和 Queue. 不过,我们建议你直接使用 Tens ...
TensorFlow入门学习(让机器/算法帮助我们作出选择)
catalogue . 个人理解 . 基本使用 . MNIST(multiclass classification)入门 . 深入MNIST . 卷积神经网络:CIFAR- 数据集分类 . 单词的向量 ...
What are some good books/papers for learning deep learning?
What's the most effective way to get started with deep learning? 29 Answers Yoshua Bengio, ...
（转）Awesome PyTorch List
Awesome-Pytorch-list 2018-08-10 09:25:16 This blog is copied from: https://github.com/Epsilon-Lee/Aw ...
[转]最好用的 AI 开源数据集 Top 39：NLP、语音等 6 大类
原文链接本文修正部分错误. 以下是精心收集的一些非常好的开放数据集,也是做 AI 研究不容错过的数据集. 标签解释 [经典]这些是在 AI 领域中非常著名.众所周知的数据集.很少有研究者或工程师没有 ...
深度学习常用数据集 API（包括 Fashion MNIST）
基准数据集深度学习中经常会使用一些基准数据集进行一些测试.其中 MNIST, Cifar 10, cifar100, Fashion-MNIST 数据集常常被人们拿来当作练手的数据集.为了方便,诸如 ...

随机推荐

ZooKeeper3.4.10集群安装配置-Docker
一. 服务器规划主机 IP 端口备注 b-mid-24 172.16.0.24 2181, 2888, 3888 2181:对cline端提供服务 3888:选举leader使用 2888:集群内 ...
ServerlessBench 2.0：华为云联合上海交大发布Serverless基准测试平台
摘要:华为云联合上海交大重磅推出ServerlessBench 2.0,为社区提供涵盖12类基准测试用例.新增5大类跨平台测试用例.4大类关键特性指标.且多平台兼容的Serverless开放基准测试集 ...
HelloWorld入门程序
程序开发步骤说明开发环境搭建完成后我们就可以开发第一个java程序了 java程序开发三步骤:编写.编译.运行编写Java源程序 1.在本地盘目录下新建文本文件,完整的文件名修改为HelloWor ...
Docker默认桥接网络是如何工作的
1. 启动一个Docker容器一般来说,我们起一个容器比如一个简单的nginx服务会向这样 docker run -d --rm nginx:XXX OK容器起来了,但是并不能通过宿主机被外面的机器 ...
Nginx Rewrite资源重定向
# Rewrite功能配置 # Rewrite功能主要是实现了url重写 # 如:你输入www.jd123.com,你可以通过Rewrite让它重定向到www.jd.com # Rewrite的实现依 ...
Linux Shell 自动交互功能
需求背景: 近日,在安装某软件过程,发现在安装过程需要输入一些信息才能继续下一步操作,在机器数量较少情况下,我们可以单台登录上去完成安装操作,但当机器数量超过一定时,如果再手动登录操作,就会产生大 ...
结束语句之 continue
C 语言自学之 continue Dome1:计算1到20之间不能被3整除的数字之和. 运算结果为: sum=147 1 #include<stdio.h> 2 ...
Vue 列动态取值
在前端开发过程中,可能会遇到列动态取值的情况,即列表中某列的取值由两个或以上的字段的值决定. 用 Vue 实现的话可以用如下代码解决 <template slot-scope="sco ...
[SDOI2017]序列计数（矩阵加速，小容斥）
题面 Alice想要得到一个长度为n的序列,序列中的数都是不超过m的正整数,而且这n个数的和是p的倍数. Alice还希望,这n个数中,至少有一个数是质数. Alice想知道,有多少个序列满足她的要求 ...
C#基础_理解类
构造函数主要是用来创建对象时为对象赋初值来初始化对象.总与new运算符一起使用在创建对象的语句中 .A a=new A(); 构造函数具有和类一样的名称:但它是一个函数具有函数的所有特性,同一个类里面 ...

cifar-10-dataset

cifar-10-dataset的更多相关文章

随机推荐

热门专题