ResNet50的猫狗分类训练及预测
相比于之前写的ResNet18,下面的ResNet50写得更加工程化一点,这还适用与其他分类。
我的代码文件结构

1. 数据处理
首先已经对数据做好了分类

文件夹结构是这样
开始划分数据集
split_data.py
import os
import random
import shutil def move_file(target_path, save_train_path, save_val_pathm, scale=0.1): file_list = os.listdir(target_path)
random.shuffle(file_list) number = int(len(file_list) * scale)
train_list = file_list[number:]
val_list = file_list[:number] for file in train_list:
target_file_path = os.path.join(target_path, file)
save_file_path = os.path.join(save_train_path, file)
shutil.copyfile(target_file_path, save_file_path)
for file in val_list:
target_file_path = os.path.join(target_path, file)
save_file_path = os.path.join(save_val_pathm, file)
shutil.copyfile(target_file_path, save_file_path) def split_classify_data(base_path, save_path, scale=0.1):
folder_list = os.listdir(base_path)
for folder in folder_list:
target_path = os.path.join(base_path, folder)
save_train_path = os.path.join(save_path, 'train', folder)
save_val_path = os.path.join(save_path, 'val', folder)
if not os.path.exists(save_train_path):
os.makedirs(save_train_path)
if not os.path.exists(save_val_path):
os.makedirs(save_val_path)
move_file(target_path, save_train_path, save_val_path, scale)
print(folder, 'finish!') if __name__ == '__main__':
base_path = r'C:\Users\Administrator.DESKTOP-161KJQD\Desktop\save_dir'
save_path = r'C:\Users\Administrator.DESKTOP-161KJQD\Desktop\dog_cat'
# 验证集比例
scale = 0.1
split_classify_data(base_path, save_path, scale)
运行完以上代码的到的文件夹结构

一个训练集数据,一个验证集数据
2.数据集的导入
我这个文件写了一个数据集的导入和一个学习率更新的函数。数据导入是通用的
tools.py
import os
import time import cv2
import numpy as np
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torchvision
from torch.autograd.variable import Variable
from torch.utils.tensorboard import SummaryWriter
from torchvision import datasets, transforms
from torch.utils.data import Dataset, DataLoader
from torch.optim.lr_scheduler import ExponentialLR, LambdaLR
from torchvision.models import ResNet50_Weights
from tqdm import tqdm
from classify_cfg import * mean = MEAN
std = STD def get_dataset(base_dir='', input_size=160):
dateset = dict()
transform_train = transforms.Compose([
# 分辨率重置为input_size
transforms.Resize(input_size),
transforms.RandomRotation(15),
# 对加载的图像作归一化处理, 并裁剪为[input_sizexinput_sizex3]大小的图像(因为这图片像素不一致直接统一)
transforms.CenterCrop(input_size),
transforms.ToTensor(),
transforms.Normalize(mean=mean, std=std)
]) transform_val = transforms.Compose([
transforms.Resize(input_size),
transforms.RandomRotation(15),
transforms.CenterCrop(input_size),
transforms.ToTensor(),
transforms.Normalize(mean=mean, std=std)
])
base_dir_train = os.path.join(base_dir, 'train')
train_dataset = datasets.ImageFolder(root=base_dir_train, transform=transform_train)
# print("train_dataset=" + repr(train_dataset[1][0].size()))
# print("train_dataset.class_to_idx=" + repr(train_dataset.class_to_idx))
# print(train_dataset.classes)
classes = train_dataset.classes
# classes = train_dataset.class_to_idx
classes_num = len(train_dataset.classes) base_dir_val = os.path.join(base_dir, 'val')
val_dataset = datasets.ImageFolder(root=base_dir_val, transform=transform_val) dateset['train'] = train_dataset
dateset['val'] = val_dataset return dateset, classes, classes_num def update_lr(epoch, epochs):
"""
假设开始的学习率lr是0.001,训练次数epochs是100
当epoch<33时是lr * 1
当33<=epoch<=66 时是lr * 0.5
当66<epoch时是lr * 0.1
"""
if epoch == 0 or epochs // 3 > epoch:
return 1
elif (epochs // 3 * 2 >= epoch) and (epochs // 3 <= epoch):
return 0.5
else:
return 0.1
3.训练模型
数据集导入好了以后,选择模型,选择优化器等等,然后开始训练。
mytrain.py
import os
import time import cv2
import numpy as np
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
from torch.autograd.variable import Variable
from torch.utils.tensorboard import SummaryWriter
from torch.utils.data import Dataset, DataLoader
from torch.optim.lr_scheduler import ExponentialLR, LambdaLR
from torchvision.models import ResNet50_Weights
# from tqdm import tqdm
from classify_cfg import *
from tools import get_dataset, update_lr def train(model, dateset, epochs, batch_size, device, optimizer, scheduler, criterion, save_path):
train_loader = DataLoader(dateset.get('train'), batch_size=batch_size, shuffle=True)
val_loader = DataLoader(dateset.get('val'), batch_size=batch_size, shuffle=True) # 保存为tensorboard文件
write = SummaryWriter(save_path)
# 训练过程写入txt
f = open(os.path.join(save_path, 'log.txt'), 'w', encoding='utf-8') best_acc = 0
for epoch in range(epochs):
train_correct = 0.0
model.train()
sum_loss = 0.0
accuracy = -1
total_num = len(train_loader.dataset)
# print(total_num, len(train_loader))
# loop = tqdm(enumerate(train_loader), total=len(train_loader))
batch_count = 0
for batch_idx, (data, target) in enumerate(train_loader):
start_time = time.time()
data, target = Variable(data).to(device), Variable(target).to(device)
output = model(data)
loss = criterion(output, target)
optimizer.zero_grad()
loss.backward()
optimizer.step() print_loss = loss.data.item()
sum_loss += print_loss
train_predict = torch.max(output.data, 1)[1]
if torch.cuda.is_available():
train_correct += (train_predict.cuda() == target.cuda()).sum()
else:
train_correct += (train_predict == target).sum()
accuracy = (train_correct / total_num) * 100
# loop.set_description(f'Epoch [{epoch+1}/{epochs}]')
# loop.set_postfix(loss=loss.item(), acc='{:.3f}'.format(accuracy))
batch_count += len(data)
end_time = time.time()
s = f'Epoch:[{epoch+1}/{epochs}] Batch:[{batch_count}/{total_num}] train_acc: {"{:.2f}".format(accuracy)} ' \
f'train_loss: {"{:.3f}".format(loss.item())} time: {int((end_time-start_time)*1000)} ms'
# print(f'Epoch:[{epoch+1}/{epochs}]', f'Batch:[{batch_count}/{total_num}]',
# 'train_acc:', '{:.2f}'.format(accuracy), 'train_loss:', '{:.3f}'.format(loss.item()),
# 'time:', f'{int((end_time-start_time)*1000)} ms')
print(s)
f.write(s+'\n') write.add_scalar('train_acc', accuracy, epoch)
write.add_scalar('train_loss', loss.item(), epoch)
# print(optimizer.param_groups[0]['lr'])
scheduler.step()
if best_acc < accuracy:
best_acc = accuracy
torch.save(model, os.path.join(save_path, 'best.pt')) if epoch+1 == epochs:
torch.save(model, os.path.join(save_path, 'last.pt')) # 预测验证集
# if (epoch+1) % 5 == 0 or epoch+1 == epochs:
model.eval()
test_loss = 0.0
correct = 0.0
total_num = len(val_loader.dataset)
# print(total_num, len(val_loader))
with torch.no_grad():
for data, target in val_loader:
data, target = Variable(data).to(device), Variable(target).to(device)
output = model(data)
loss = criterion(output, target)
_, pred = torch.max(output.data, 1)
if torch.cuda.is_available():
correct += torch.sum(pred.cuda() == target.cuda())
else:
correct += torch.sum(pred == target)
print_loss = loss.data.item()
test_loss += print_loss
acc = correct / total_num * 100
avg_loss = test_loss / len(val_loader)
s = f"val acc: {'{:.2f}'.format(acc)} val loss: {'{:.3f}'.format(avg_loss)}"
# print('val acc: ', '{:.2f}'.format(acc), 'val loss: ', '{:.3f}'.format(avg_loss))
print(s)
f.write(s+'\n')
write.add_scalar('val_acc', acc, epoch)
write.add_scalar('val_loss', avg_loss, epoch)
# loop.set_postfix(val_loss='{:.3f}'.format(avg_loss), val_acc='{:.3f}'.format(acc)) f.close() if __name__ == '__main__':
device = DEVICE
epochs = EPOCHS
batch_size = BATCH_SIZE
input_size = INPUT_SIZE
lr = LR
# ---------------------------训练-------------------------------------
# 图片的路径
base_dir = r'C:\Users\Administrator.DESKTOP-161KJQD\Desktop\dog_cat'
# 保存的路径
save_path = r'C:\Users\Administrator.DESKTOP-161KJQD\Desktop\dog_cat_save'
dateset, classes, classes_num = get_dataset(base_dir, input_size=input_size)
# model = torchvision.models.resnet50(pretrained=True)
model = torchvision.models.resnet50(weights=ResNet50_Weights.IMAGENET1K_V1)
num_ftrs = model.fc.in_features
model.fc = nn.Linear(num_ftrs, classes_num)
model.to(DEVICE)
# # 损失函数,交叉熵损失函数
criteon = nn.CrossEntropyLoss()
# 选择优化器
optimizer = optim.SGD(model.parameters(), lr=lr)
# 学习率更新
# scheduler = ExponentialLR(optimizer, gamma=0.9)
scheduler = LambdaLR(optimizer, lr_lambda=lambda epoch: update_lr(epoch, epochs))
# 开始训练
train(model, dateset, epochs, batch_size, device, optimizer, scheduler, criteon, save_path)
# 将label保存起来
with open(os.path.join(save_path, 'labels.txt'), 'w', encoding='utf-8') as f:
f.write(f'{classes_num} {classes}')
训练结束以后,在保存路径下会得到下面的文件

最好的模型,最后一次的模型,标签的列表,训练的记录和tensorboard记录
在该路径下执行 tensorboard --logdir=.

然后在浏览器打开给出的地址,即可看到数据训练过程的绘图
4.对图片进行预测
考虑对于用户来说,用户是在网页或者手机上上传一张图片进行预测,所以这边是采用二进制数据。
mypredict.py
import cv2
import numpy as np
import torch from classify_cfg import * def img_process(img_betys, img_size, device): img_arry = np.asarray(bytearray(img_betys), dtype='uint8')
# im0 = cv2.imread(img_betys)
im0 = cv2.imdecode(img_arry, cv2.IMREAD_COLOR)
image = cv2.resize(im0, (img_size, img_size))
image = np.float32(image) / 255.0
image[:, :, ] -= np.float32(mean)
image[:, :, ] /= np.float32(std)
image = image.transpose((2, 0, 1))
im = torch.from_numpy(image).unsqueeze(0)
im = im.to(device)
return im def predict(model_path, img, device):
model = torch.load(model_path)
model.to(device)
model.eval()
predicts = model(img)
# print(predicts)
_, preds = torch.max(predicts, 1)
pred = torch.squeeze(preds)
# print(pred)
return pred if __name__ == '__main__':
mean = MEAN
std = STD
device = DEVICE
classes = ['狗', '猫']
# # 预测
model_path = r'C:\Users\Administrator.DESKTOP-161KJQD\Desktop\dog_cat_save\best.pt'
img_path = r'C:\Users\Administrator.DESKTOP-161KJQD\Desktop\save_dir\狗\000000.jpg'
with open(img_path, 'rb') as f:
img_betys = f.read()
img =img_process(img_betys, 160, device)
# print(img.shape)
# print(img)
pred = predict(model_path, img, device)
print(classes[int(pred)])
ResNet50的猫狗分类训练及预测的更多相关文章
- paddlepaddle实现猫狗分类
目录 1.预备工作 1.1 数据集准备 1.2 数据预处理 2.训练 2.1 模型 2.2 定义训练 2.3 训练 3.预测 4.参考文献 声明:这是我的个人学习笔记,大佬可以点评,指导,不喜勿喷.实 ...
- 人工智能——CNN卷积神经网络项目之猫狗分类
首先先导入所需要的库 import sys from matplotlib import pyplot from tensorflow.keras.utils import to_categorica ...
- 用tensorflow迁移学习猫狗分类
笔者这几天在跟着莫烦学习TensorFlow,正好到迁移学习(至于什么是迁移学习,看这篇),莫烦老师做的是预测猫和老虎尺寸大小的学习.作为一个有为的学生,笔者当然不能再预测猫啊狗啊的大小啦,正好之前正 ...
- 猫狗分类--Tensorflow实现
贴一张自己画的思维导图 数据集准备 kaggle猫狗大战数据集(训练),微软的不需要FQ 12500张cat 12500张dog 生成图片路径和标签的List step1:获取D:/Study/Py ...
- 1.keras实现-->自己训练卷积模型实现猫狗二分类(CNN)
原数据集:包含 25000张猫狗图像,两个类别各有12500 新数据集:猫.狗 (照片大小不一样) 训练集:各1000个样本 验证集:各500个样本 测试集:各500个样本 1= 狗,0= 猫 # 将 ...
- 使用pytorch完成kaggle猫狗图像识别
kaggle是一个为开发商和数据科学家提供举办机器学习竞赛.托管数据库.编写和分享代码的平台,在这上面有非常多的好项目.好资源可供机器学习.深度学习爱好者学习之用.碰巧最近入门了一门非常的深度学习框架 ...
- Kaggle系列1:手把手教你用tensorflow建立卷积神经网络实现猫狗图像分类
去年研一的时候想做kaggle上的一道题目:猫狗分类,但是苦于对卷积神经网络一直没有很好的认识,现在把这篇文章的内容补上去.(部分代码参考网上的,我改变了卷积神经网络的网络结构,其实主要部分我加了一层 ...
- pytorch实现kaggle猫狗识别
参考:https://blog.csdn.net/weixin_37813036/article/details/90718310 kaggle是一个为开发商和数据科学家提供举办机器学习竞赛.托管数据 ...
- 深度学习原理与框架-猫狗图像识别-卷积神经网络(代码) 1.cv2.resize(图片压缩) 2..get_shape()[1:4].num_elements(获得最后三维度之和) 3.saver.save(训练参数的保存) 4.tf.train.import_meta_graph(加载模型结构) 5.saver.restore(训练参数载入)
1.cv2.resize(image, (image_size, image_size), 0, 0, cv2.INTER_LINEAR) 参数说明:image表示输入图片,image_size表示变 ...
- 【猫狗数据集】pytorch训练猫狗数据集之创建数据集
猫狗数据集的分为训练集25000张,在训练集中猫和狗的图像是混在一起的,pytorch读取数据集有两种方式,第一种方式是将不同类别的图片放于其对应的类文件夹中,另一种是实现读取数据集类,该类继承tor ...
随机推荐
- ASP.NET Core 读取配置文件信息
一:读取配置文件 先来看一下appsettings.json文件的内容,如下图: { "ConnectionStrings": { "ServerConnection&q ...
- Unity 转小游戏
填写appid 和游戏资源位置 在导出的项目里可以修改游戏资源位置 两个目录 minigame 是小程序打开的目录 webgl 是要下载的的资源 下载一个http 服务器就有了 和JS交互 大部分js ...
- pip下载时使用国内镜像 设置pip.ini文件
https://blog.csdn.net/u011107575/article/details/109901086 https://www.python.org/ftp/python/https:/ ...
- opengl编程天天踩的坑
1. VBO 的 target 是 GL_ARRAY_BUFFER 不是 GL_VERTEX_BUFFER 2. glUniform()用来给uniform传变量 别用成 glProgramUnif ...
- Eclipse's Content Assist
在Eclipse里面的辅助智能索引只有"."才会提示,或者手动按alt+/补全提示.因为Eclipse的补全功能的默认设置只有".",其实你只需要稍微修改一下就 ...
- iframe页面加载完成为什么还是获取不到里面的dom
iframe页面加载完成为什么还是获取不到里面的dom? 因为Iframe是跨域,跨域的情况下是无法获取到iframe里面的DOM的,即使iframe加载完成,也无法获取到里面的DOM. 有什么方法获 ...
- UIPath踩坑记一UIpath中抓取数据后在tableau中无表头
UIpath抓取数据存在Excel中(Excel 应用程序范围),且已设置表头,但是放到tableau中无表头 更换为"写入范围(工作簿)",同时属性设置必须勾选"添加标 ...
- 排序方法-c语言
在接触过得排序算法中中,较为常见的有冒泡排序.选择排序.归并排序.快速排序法,他们的区别在于稳定性.时间复杂度.空间复杂度等: 现简单复习一下冒泡排序: 思路非常简单,逐个比较相邻的两个元素,前一个元 ...
- 字符串练习1 于是他错误的点名开始了(Trie)
题目链接在这里:P2580 于是他错误的点名开始了 - 洛谷 | 计算机科学教育新生态 (luogu.com.cn) 是一道trie树的板子题,注意理解trie树的每一个节点代表的是一个状态,这个状态 ...
- unity踩坑集锦
1.AB包加载,如果项目没有这个tag,那么就匹配不上,和代码一样.2.unity打包安卓topbar想显示出来怎么做?:不渲染安全区域外 3. unity编辑器报错 : Expanding inv ...