利用keras实现MobileNet,并以mnist数据集作为一个小例子进行识别。使用的环境是:tensorflow-gpu 2.0,python=3.7,GPU为 RTX 2070。
- 首先是导入两行魔法命令,可以多行显示.
%config InteractiveShell.ast_node_interactivity="all"
- 加载keras中自带的mnist数据
import tensorflow as tf
import keras
# Load the MNIST dataset that ships with Keras and unpack the two splits.
mnist = keras.datasets.mnist
train_split, test_split = mnist.load_data()
x_train, y_train = train_split
x_test, y_test = test_split
- 数据的转换
从mnist下载的数据的分辨率是28×28的,而mobilenet用来训练的数据是ImageNet,其图片的分辨率是224×224,所以先将图片的尺寸调整为224×224。
from PIL import Image
import numpy as np
def convert_mnist_224pix(X):
    """Resize a single image array to 224x224 pixels.

    The original body returned an undefined name (``x``) and contained no
    resizing logic, so calling it raised ``NameError``.

    Args:
        X: 2-D image array accepted by ``PIL.Image.fromarray``.
            NOTE(review): presumably one 28x28 uint8 MNIST digit - confirm.

    Returns:
        A NumPy array of shape (224, 224) holding the resized image.
    """
    # Round-trip through PIL so the library performs the interpolation.
    resized = Image.fromarray(X).resize((224, 224))
    return np.array(resized)
# Resize every training image to 224x224 and collect the results in one
# pre-allocated float32 buffer.
# NOTE(review): the buffer holds len(x_train) * 224 * 224 float32 values;
# assuming the usual 60,000 MNIST training images that is roughly 12 GB of
# RAM - confirm the host has enough memory.
new_train = np.zeros((len(x_train), 224, 224), dtype=np.float32)
for i, data in enumerate(x_train):
    new_train[i] = convert_mnist_224pix(data)
    # Light progress report so a long conversion does not look stalled.
    if i % 5000 == 0:
        print(i)
- 导入所有需要的函数和库
from keras.layers import Conv2D,DepthwiseConv2D,Dense,AveragePooling2D,BatchNormalization,Input
from keras import Model
from keras import Sequential
from keras.layers.advanced_activations import ReLU
from keras.utils import to_categorical
- 自己定义中间可以重复利用的层,将其放在一起,简化搭建网络的重复代码。
def depth_point_conv2d(x, s=(1, 1, 2, 1), channel=(64, 128)):
    """Apply two consecutive depthwise + pointwise convolution stages.

    Each stage is: 3x3 depthwise convolution -> batch normalization -> ReLU
    -> 1x1 (pointwise) convolution -> batch normalization -> ReLU, all with
    'same' padding.

    Args:
        x: Input tensor the first depthwise convolution is applied to.
        s: Four strides, in order: first depthwise, first pointwise,
            second depthwise, second pointwise convolution.
        channel: Two filter counts, one per pointwise convolution.

    Returns:
        The output tensor of the final ReLU.
    """
    # Defaults are tuples rather than lists so they cannot be mutated and
    # shared between calls; they are only ever indexed.
    stages = (
        (s[0], s[1], channel[0]),
        (s[2], s[3], channel[1]),
    )
    out = x
    for depthwise_stride, pointwise_stride, filters in stages:
        out = DepthwiseConv2D((3, 3), strides=depthwise_stride, padding='same')(out)
        out = BatchNormalization()(out)
        out = ReLU()(out)
        out = Conv2D(filters, (1, 1), strides=pointwise_stride, padding='same')(out)
        out = BatchNormalization()(out)
        out = ReLU()(out)
    return out
def repeat_conv(x, s=(1, 1), channel=512):
    """Apply one depthwise + pointwise convolution stage.

    The stage is: 3x3 depthwise convolution -> batch normalization -> ReLU
    -> 1x1 (pointwise) convolution -> batch normalization -> ReLU, all with
    'same' padding.

    Args:
        x: Input tensor the depthwise convolution is applied to.
        s: Two strides: the depthwise stride, then the pointwise stride.
        channel: Number of filters of the pointwise convolution.

    Returns:
        The output tensor of the final ReLU.
    """
    # The default is a tuple rather than a list so it cannot be mutated and
    # shared between calls; it is only ever indexed.
    depthwise = DepthwiseConv2D((3, 3), strides=s[0], padding='same')(x)
    depthwise = ReLU()(BatchNormalization()(depthwise))
    pointwise = Conv2D(channel, (1, 1), strides=s[1], padding='same')(depthwise)
    return ReLU()(BatchNormalization()(pointwise))
根据mobilenet论文中的结构进行模型的搭建
- 搭建网络
# Assemble the MobileNet-style classifier with the Keras functional API.
#
# The input and the classification layer are named explicitly because
# data_generate() feeds batches through dicts keyed by exactly these layer
# names; Keras' auto-generated names depend on how many layers were created
# earlier in the session and would otherwise not match on a fresh kernel.
h0 = Input(shape=(224, 224, 1), name="input_11")

# Stem: strided 3x3 convolution followed by batch normalization and ReLU.
h1 = Conv2D(32, (3, 3), strides=2, padding="same")(h0)
h2 = BatchNormalization()(h1)
h3 = ReLU()(h2)

# Depthwise-separable stages; each depth_point_conv2d call halves the
# spatial resolution once (its second depthwise convolution has stride 2).
h4 = depth_point_conv2d(h3, s=[1, 1, 2, 1], channel=[64, 128])
h5 = depth_point_conv2d(h4, s=[1, 1, 2, 1], channel=[128, 256])
h6 = depth_point_conv2d(h5, s=[1, 1, 2, 1], channel=[256, 512])
h7 = repeat_conv(h6)
h8 = repeat_conv(h7)
h9 = repeat_conv(h8)
h10 = repeat_conv(h9)
h11 = depth_point_conv2d(h10, s=[1, 1, 2, 1], channel=[512, 1024])
h12 = repeat_conv(h11, channel=1024)

# Head: 7x7 average pooling, then a 10-way softmax.
# NOTE: there is no Flatten layer, so Dense acts on the last axis and the
# model output has shape (None, 1, 1, 10); labels must be shaped to match.
h13 = AveragePooling2D((7, 7))(h12)
h14 = Dense(10, activation='softmax', name="dense_4")(h13)

# `inputs` / `outputs` are the current keyword names of the Model
# constructor (`input` / `output` are legacy spellings).
model = Model(inputs=h0, outputs=h14)
Model: "model_4"
Layer (type) Output Shape Param #
input_11 (InputLayer) (None, 224, 224, 1) 0
conv2d_63 (Conv2D) (None, 112, 112, 32) 320
batch_normalization_120 (Bat (None, 112, 112, 32) 128
re_lu_120 (ReLU) (None, 112, 112, 32) 0
depthwise_conv2d_58 (Depthwi (None, 112, 112, 32) 320
batch_normalization_121 (Bat (None, 112, 112, 32) 128
re_lu_121 (ReLU) (None, 112, 112, 32) 0
conv2d_64 (Conv2D) (None, 112, 112, 64) 2112
batch_normalization_122 (Bat (None, 112, 112, 64) 256
re_lu_122 (ReLU) (None, 112, 112, 64) 0
depthwise_conv2d_59 (Depthwi (None, 56, 56, 64) 640
batch_normalization_123 (Bat (None, 56, 56, 64) 256
re_lu_123 (ReLU) (None, 56, 56, 64) 0
conv2d_65 (Conv2D) (None, 56, 56, 128) 8320
batch_normalization_124 (Bat (None, 56, 56, 128) 512
re_lu_124 (ReLU) (None, 56, 56, 128) 0
depthwise_conv2d_60 (Depthwi (None, 56, 56, 128) 1280
batch_normalization_125 (Bat (None, 56, 56, 128) 512
re_lu_125 (ReLU) (None, 56, 56, 128) 0
conv2d_66 (Conv2D) (None, 56, 56, 128) 16512
batch_normalization_126 (Bat (None, 56, 56, 128) 512
re_lu_126 (ReLU) (None, 56, 56, 128) 0
depthwise_conv2d_61 (Depthwi (None, 28, 28, 128) 1280
batch_normalization_127 (Bat (None, 28, 28, 128) 512
re_lu_127 (ReLU) (None, 28, 28, 128) 0
conv2d_67 (Conv2D) (None, 28, 28, 256) 33024
batch_normalization_128 (Bat (None, 28, 28, 256) 1024
re_lu_128 (ReLU) (None, 28, 28, 256) 0
depthwise_conv2d_62 (Depthwi (None, 28, 28, 256) 2560
batch_normalization_129 (Bat (None, 28, 28, 256) 1024
re_lu_129 (ReLU) (None, 28, 28, 256) 0
conv2d_68 (Conv2D) (None, 28, 28, 256) 65792
batch_normalization_130 (Bat (None, 28, 28, 256) 1024
re_lu_130 (ReLU) (None, 28, 28, 256) 0
depthwise_conv2d_63 (Depthwi (None, 14, 14, 256) 2560
batch_normalization_131 (Bat (None, 14, 14, 256) 1024
re_lu_131 (ReLU) (None, 14, 14, 256) 0
conv2d_69 (Conv2D) (None, 14, 14, 512) 131584
batch_normalization_132 (Bat (None, 14, 14, 512) 2048
re_lu_132 (ReLU) (None, 14, 14, 512) 0
depthwise_conv2d_64 (Depthwi (None, 14, 14, 512) 5120
batch_normalization_133 (Bat (None, 14, 14, 512) 2048
re_lu_133 (ReLU) (None, 14, 14, 512) 0
conv2d_70 (Conv2D) (None, 14, 14, 512) 262656
batch_normalization_134 (Bat (None, 14, 14, 512) 2048
re_lu_134 (ReLU) (None, 14, 14, 512) 0
depthwise_conv2d_65 (Depthwi (None, 14, 14, 512) 5120
batch_normalization_135 (Bat (None, 14, 14, 512) 2048
re_lu_135 (ReLU) (None, 14, 14, 512) 0
conv2d_71 (Conv2D) (None, 14, 14, 512) 262656
batch_normalization_136 (Bat (None, 14, 14, 512) 2048
re_lu_136 (ReLU) (None, 14, 14, 512) 0
depthwise_conv2d_66 (Depthwi (None, 14, 14, 512) 5120
batch_normalization_137 (Bat (None, 14, 14, 512) 2048
re_lu_137 (ReLU) (None, 14, 14, 512) 0
conv2d_72 (Conv2D) (None, 14, 14, 512) 262656
batch_normalization_138 (Bat (None, 14, 14, 512) 2048
re_lu_138 (ReLU) (None, 14, 14, 512) 0
depthwise_conv2d_67 (Depthwi (None, 14, 14, 512) 5120
batch_normalization_139 (Bat (None, 14, 14, 512) 2048
re_lu_139 (ReLU) (None, 14, 14, 512) 0
conv2d_73 (Conv2D) (None, 14, 14, 512) 262656
batch_normalization_140 (Bat (None, 14, 14, 512) 2048
re_lu_140 (ReLU) (None, 14, 14, 512) 0
depthwise_conv2d_68 (Depthwi (None, 14, 14, 512) 5120
batch_normalization_141 (Bat (None, 14, 14, 512) 2048
re_lu_141 (ReLU) (None, 14, 14, 512) 0
conv2d_74 (Conv2D) (None, 14, 14, 512) 262656
batch_normalization_142 (Bat (None, 14, 14, 512) 2048
re_lu_142 (ReLU) (None, 14, 14, 512) 0
depthwise_conv2d_69 (Depthwi (None, 7, 7, 512) 5120
batch_normalization_143 (Bat (None, 7, 7, 512) 2048
re_lu_143 (ReLU) (None, 7, 7, 512) 0
conv2d_75 (Conv2D) (None, 7, 7, 1024) 525312
batch_normalization_144 (Bat (None, 7, 7, 1024) 4096
re_lu_144 (ReLU) (None, 7, 7, 1024) 0
depthwise_conv2d_70 (Depthwi (None, 7, 7, 1024) 10240
batch_normalization_145 (Bat (None, 7, 7, 1024) 4096
re_lu_145 (ReLU) (None, 7, 7, 1024) 0
conv2d_76 (Conv2D) (None, 7, 7, 1024) 1049600
batch_normalization_146 (Bat (None, 7, 7, 1024) 4096
re_lu_146 (ReLU) (None, 7, 7, 1024) 0
average_pooling2d_5 (Average (None, 1, 1, 1024) 0
dense_4 (Dense) (None, 1, 1, 10) 10250
Total params: 3,249,482
Trainable params: 3,227,594
Non-trainable params: 21,888
# Append a trailing channel axis so the images match the model's
# (224, 224, 1) input.
x_train = np.expand_dims(new_train, 3)
# One-hot encode the integer class labels.
y_train = to_categorical(y_train)
# The model's Dense layer outputs (None, 1, 1, 10), so insert two singleton
# axes after the batch axis. The original expanded an undefined `y`.
# NOTE(review): assumes y_train is (N, 10) after to_categorical - confirm.
y = np.expand_dims(np.expand_dims(y_train, 1), 1)
- 定义数据生成函数
def data_generate(x_train, y_train, batch_size, epochs,
                  input_name="input_11", output_name="dense_4",
                  shuffle=False):
    """Yield training batches as ``({input_name: x}, {output_name: y})``.

    The data is cut into ``len(x_train) // batch_size`` consecutive batches;
    any trailing samples that do not fill a whole batch are dropped. That
    sequence of batches is produced ``epochs`` times, after which the
    generator is exhausted.

    Args:
        x_train: Sliceable sequence of inputs.
        y_train: Sliceable sequence of targets, aligned with ``x_train``.
        batch_size: Number of samples per batch.
        epochs: Number of full passes over the batches.
        input_name: Dict key used for the inputs; it must equal the name of
            the model's input layer. Defaults to the previously hard-coded
            ``"input_11"``.
        output_name: Dict key used for the targets; it must equal the name
            of the model's output layer. Defaults to the previously
            hard-coded ``"dense_4"``.
        shuffle: When true, visit the batches in a fresh random order on
            every pass. Defaults to False, which keeps the original
            sequential order.

    Yields:
        A 2-tuple of single-entry dicts: inputs and targets of one batch.
    """
    # The batch count does not change between passes, so compute it once.
    batch_num = len(x_train) // batch_size
    for _ in range(epochs):
        if shuffle:
            batch_order = np.random.permutation(batch_num)
        else:
            batch_order = np.arange(batch_num)
        for j in batch_order:
            begin = j * batch_size
            end = begin + batch_size
            yield ({input_name: x_train[begin:end]},
                   {output_name: y_train[begin:end]})
- 开始训练
Executing op VarHandleOp in device /job:localhost/replica:0/task:0/device:GPU:0
Epoch 1/10
Executing op __inference_keras_scratch_graph_22639 in device /job:localhost/replica:0/task:0/device:GPU:0
600/600 [==============================] - 411s 684ms/step - loss: 0.1469 - accuracy: 0.9529
Epoch 2/10
600/600 [==============================] - 398s 663ms/step - loss: 0.0375 - accuracy: 0.9884
Epoch 3/10
600/600 [==============================] - 401s 668ms/step - loss: 0.0283 - accuracy: 0.9909
Epoch 4/10
600/600 [==============================] - 399s 665ms/step - loss: 0.0211 - accuracy: 0.9936
Epoch 5/10
600/600 [==============================] - 400s 666ms/step - loss: 0.0216 - accuracy: 0.9932
Epoch 6/10
600/600 [==============================] - 401s 668ms/step - loss: 0.0208 - accuracy: 0.9935
Epoch 7/10
600/600 [==============================] - 401s 669ms/step - loss: 0.0174 - accuracy: 0.9945
Epoch 8/10
131/600 [=====>........................] - ETA: 5:13 - loss: 0.0091 - accuracy: 0.9973
【推荐】国内首个AI IDE,深度理解中文开发场景,立即下载体验Trae
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· 记一次.NET内存居高不下排查解决与启示
· 探究高空视频全景AR技术的实现原理
· 理解Rust引用及其生命周期标识(上)
· 浏览器原生「磁吸」效果!Anchor Positioning 锚点定位神器解析
· 没有源码,如何修改代码逻辑?
· 分享4款.NET开源、免费、实用的商城系统
· 全程不用写代码,我用AI程序员写了一个飞机大战
· MongoDB 8.0这个新功能碉堡了,比商业数据库还牛
· 白话解读 Dapr 1.15:你的「微服务管家」又秀新绝活了
· 上周热点回顾(2.24-3.2)