Implementing a CNN with NumPy

2023-05-16

After several days of work, I finally finished a complete CNN framework; the trickiest part by far is the backward pass through the convolution layer.

Network architecture

Packages used

Dataset: MNIST

1,000 samples are drawn at random for the training set, and 100 for the test set.

Overall flow

 

'''First, think it through: a 28*28*1 image has 784 features, while even a fairly
small 100*100*3 image (and 100*100*3 really is small) has 30,000, so each unit in
the first fully connected layer would need 30,000 weights. Optimizing that many
parameters is very slow, especially when each iteration processes a batch of only
10 images. A convolutional network handles this well -- below: how CNNs work, how
the loss is defined, and how the parameters are optimized.'''
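
'''A rough parameter count makes the point concrete (a back-of-envelope
sketch, not part of the network below): a dense layer mapping a 100*100*3
image to just 100 hidden units needs 100*100*3*100 = 3,000,000 weights,
while ten 5*5*3 convolution kernels need only 5*5*3*10 = 750, shared across
all positions of the image.'''
fc_weights = 100 * 100 * 3 * 100  # 3,000,000
conv_weights = 5 * 5 * 3 * 10     # 750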

'''Input layer -- convolution layer -- pooling layer (downsampling/compression) -- fully connected layer'''
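
'''Shape trace for the network built in train() below (MNIST, batch size N):
N*1*28*28 -> conv1 (6 kernels, 5x5) -> N*6*24*24 -> relu -> pool -> N*6*12*12
-> conv2 (16 kernels, 5x5) -> N*16*8*8 -> relu -> pool -> N*16*4*4
-> flatten -> N*256 -> Linear(256, 10) -> N*10 -> softmax'''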

import numpy as np
import random



def load_data():
    # training set (idx files are binary, so open them in 'rb' mode for np.fromfile)
    with open('C:/Users/admin/Desktop/新建文件夹/数据挖掘/机器学习/多层感知机/MINIST_data/train-images.idx3-ubyte', 'rb') as f:
        loaded = np.fromfile(file=f, dtype=np.uint8)
        train_data = loaded[16:].reshape((60000, 784))
    print(train_data.shape)  # (60000, 784)

    with open('C:/Users/admin/Desktop/新建文件夹/数据挖掘/机器学习/多层感知机/MINIST_data/train-labels.idx1-ubyte', 'rb') as f:
        loaded = np.fromfile(file=f, dtype=np.uint8)
        train_labels = loaded[8:]
    print(train_labels.shape)  # (60000,)

    # test set
    with open('C:/Users/admin/Desktop/新建文件夹/数据挖掘/机器学习/多层感知机/MINIST_data/t10k-images.idx3-ubyte', 'rb') as f:
        loaded = np.fromfile(file=f, dtype=np.uint8)
        test_data = loaded[16:].reshape((10000, 784))
    print(test_data.shape)  # (10000, 784)

    with open('C:/Users/admin/Desktop/新建文件夹/数据挖掘/机器学习/多层感知机/MINIST_data/t10k-labels.idx1-ubyte', 'rb') as f:
        loaded = np.fromfile(file=f, dtype=np.uint8)
        test_labels = loaded[8:].reshape((10000))
    print(test_labels.shape)  # (10000,)
    return train_data, train_labels, test_data, test_labels


def max_pooling(array):
    '''2x2 max pooling with stride 2. Also returns a 0/1 mask marking each
    window's max position, used to route gradients in the backward pass.'''
    n, m = array.shape
    new_image = np.zeros((int(n / 2), int(m / 2)))
    delta_pooling = np.zeros((n, m))
    for i in range(0, int(n / 2)):
        for j in range(0, int(m / 2)):
            new_image[i][j] = np.max(array[i * 2:i * 2 + 2, j * 2:j * 2 + 2])
            index = np.unravel_index(array[i * 2:i * 2 + 2, j * 2:j * 2 + 2].argmax(),
                                     array[i * 2:i * 2 + 2, j * 2:j * 2 + 2].shape)
            middle = np.zeros((2, 2))
            middle[index[0]][index[1]] = 1
            delta_pooling[i * 2:i * 2 + 2, j * 2:j * 2 + 2] = middle
    return new_image, delta_pooling
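
# Minimal sanity check for max_pooling (an illustrative sketch, not called
# anywhere in training): a 4x4 input pools to 2x2, and the returned mask has
# a single 1 at each window's argmax.
def _demo_max_pooling():
    a = np.arange(16, dtype=float).reshape(4, 4)
    pooled, mask = max_pooling(a)
    print(pooled)  # [[ 5.  7.] [13. 15.]]
    print(mask)    # a 1 in the bottom-right corner of every 2x2 window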

def conv_3d(array, kernel, b, stride=1):
    '''Valid cross-correlation of a multi-channel input (n, h, w) with a single
    multi-channel kernel (n, h_1, w_1), summed over channels, plus bias b.'''
    n, h, w = array.shape
    n_1, h_1, w_1 = kernel.shape
    new_image = np.zeros((h - h_1 + 1, w - w_1 + 1))
    for i in range(0, h - h_1 + 1):
        for j in range(0, w - w_1 + 1):
            new_image[i][j] = np.sum(array[:, i:i + h_1, j:j + w_1] * kernel) + b
    return new_image
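
# Minimal sanity check for conv_3d (illustrative, not part of training): an
# all-ones 1x3x3 input with an all-ones 1x2x2 kernel and b=0 gives a 2x2
# output of 4s, since each window sums four ones.
def _demo_conv_3d():
    out = conv_3d(np.ones((1, 3, 3)), np.ones((1, 2, 2)), b=0)
    print(out)  # [[4. 4.] [4. 4.]]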


class Linear(object):
    def __init__(self, input_size, output_size):
        scale = np.sqrt(input_size / 2)

        self.W = np.random.standard_normal((input_size, output_size)) / scale
        self.b = np.random.standard_normal(output_size) / scale

        self.W_grad = np.zeros((input_size, output_size))
        self.b_grad = np.zeros(output_size)

    def forward(self, x):
        self.x = x
        out = np.dot(x, self.W) + self.b
        return out

    def bp(self, delta, lr):
        '''Simple backward pass: average the gradients over the batch, update
        the parameters, and return the gradient w.r.t. the input.'''
        shape = delta.shape
        self.b_grad = np.sum(delta, axis=0) / shape[0]
        self.W_grad = np.dot(self.x.T, delta) / shape[0]
        new_delta = np.dot(delta, self.W.T)

        self.W -= lr * self.W_grad
        self.b -= lr * self.b_grad

        return new_delta
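
# Shape sketch for Linear (illustrative): a batch of 4 samples with 256
# features maps to 10 logits, and bp returns a gradient of the input's shape.
def _demo_linear():
    layer = Linear(256, 10)
    x = np.random.randn(4, 256)
    out = layer.forward(x)
    new_delta = layer.bp(np.random.randn(4, 10), lr=0.01)
    print(out.shape, new_delta.shape)  # (4, 10) (4, 256)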


class Relu(object):
    def forward(self, x):
        self.x = x
        return np.maximum(x, 0)

    def backward(self, delta):
        # pass the gradient through where x > 0, zero it where x < 0 (modifies delta in place)
        delta[self.x < 0] = 0
        return delta


class Pooling(object):
    def forward(self, x):
        self.x = x
        shape = self.x.shape
        out = np.zeros((shape[0], shape[1], shape[2] // 2, shape[3] // 2))
        self.delta = np.zeros(shape)
        for i in range(shape[0]):
            for j in range(shape[1]):
                out[i][j], self.delta[i][j] = max_pooling(self.x[i][j])
        return out

    def bp(self, delta):
        shape = self.delta.shape
        for i in range(shape[0]):
            for j in range(shape[1]):
                for n in range(shape[2]):
                    for m in range(shape[3]):
                        if self.delta[i][j][n][m] == 1:
                            self.delta[i][j][n][m] = delta[i][j][n // 2][m // 2]
        return self.delta

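# Shape sketch for Pooling (illustrative): N*C*H*W halves to N*C*(H/2)*(W/2),
# and bp routes each upstream gradient back to its window's max position.
def _demo_pooling():
    pool = Pooling()
    x = np.random.randn(2, 3, 4, 4)
    out = pool.forward(x)               # (2, 3, 2, 2)
    grad = pool.bp(np.ones(out.shape))  # nonzero only at the window maxima
    print(out.shape, grad.shape)        # (2, 3, 2, 2) (2, 3, 4, 4)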


class Softmax(object):
    def forward(self, x, y):
        '''Softmax plus cross-entropy loss; returns the mean loss and the
        combined gradient delta = softmax(x) - y.'''
        self.x = x
        shape = self.x.shape
        out = np.exp(self.x - np.max(self.x))  # subtract the max for numerical stability
        for i in range(shape[0]):
            sums = np.sum(out[i, :])
            for j in range(shape[1]):
                out[i][j] = out[i][j] / sums
        loss = 0
        delta = np.zeros(shape)
        for i in range(shape[0]):
            delta[i] = out[i] - y[i]
            for j in range(shape[1]):
                loss += - y[i][j] * np.log(out[i][j])
        loss /= shape[0]
        return loss, delta

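# Quick numeric check for Softmax (illustrative): logits that strongly favour
# the true class give a small loss, and delta = softmax(x) - y.
def _demo_softmax():
    loss, delta = Softmax().forward(np.array([[5.0, 0.0]]), np.array([[1.0, 0.0]]))
    print(loss)   # ~0.0067, i.e. -log(e^5 / (e^5 + 1))
    print(delta)  # ~[[-0.0067  0.0067]]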


class Conv(object):
    def __init__(self, kernel_shape, stride=1):
        n_out, n_in, wk, hk = kernel_shape

        self.stride = stride

        scale = np.sqrt(3 * wk * hk * n_in / n_out)
        self.k = np.random.standard_normal(kernel_shape) / scale
        self.b = np.random.standard_normal(n_out) / scale

        self.k_grad = np.zeros(kernel_shape)
        self.b_grad = np.zeros(n_out)

    def forward(self, x):
        self.x = x
        shape0 = self.x.shape
        shape1 = self.k.shape
        out = np.zeros((shape0[0], shape1[0], shape0[2] - shape1[2] + 1, shape0[3] - shape1[3] + 1))

        for i in range(out.shape[0]):
            for j in range(out.shape[1]):
                out[i][j] = conv_3d(self.x[i], self.k[j], self.b[j])

        return out

    def bp(self, delta, lr):
        shape = delta.shape
        for i in range(shape[0]):
            for j in range(shape[1]):
                for n in range(shape[2]):
                    for m in range(shape[3]):
                        self.k_grad[j] += delta[i, j, n, m] * self.x[i, :, n:n + self.k.shape[2],
                                                              m:m + self.k.shape[3]]
        self.b_grad = np.sum(delta, axis=(0, 2, 3))
        self.k_grad /= shape[0]
        self.b_grad /= shape[0]

        '''Gradient w.r.t. the input x: pad delta and convolve it with the
        kernel rotated 180 degrees (a "full" convolution).'''
        k_180 = np.rot90(self.k, 2, (2, 3))
        shape1 = self.x.shape
        padding = np.zeros(
            (shape1[0], shape[1], self.x.shape[2] + self.k.shape[2] - 1, self.x.shape[3] + self.k.shape[3] - 1))
        pad = (self.x.shape[2] + self.k.shape[2] - 1 - delta.shape[2]) // 2
        for i in range(padding.shape[0]):
            for j in range(padding.shape[1]):
                padding[i][j] = np.pad(delta[i][j], ((pad, pad), (pad, pad)), 'constant')
        k_180 = k_180.swapaxes(0, 1)

        shape0 = padding.shape
        shape1 = k_180.shape
        out = np.zeros((shape0[0], shape1[0], shape0[2] - shape1[2] + 1, shape0[3] - shape1[3] + 1))

        for i in range(out.shape[0]):
            for j in range(out.shape[1]):
                out[i][j] = conv_3d(padding[i], k_180[j], 0)
        self.k -= lr * self.k_grad
        self.b -= lr * self.b_grad
        return out
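
# Shape sketch for Conv (illustrative): six 1x5x5 kernels map N*1*28*28 to
# N*6*24*24, and bp returns a gradient with the input's shape.
def _demo_conv():
    conv = Conv(kernel_shape=(6, 1, 5, 5))
    x = np.random.randn(2, 1, 28, 28)
    out = conv.forward(x)
    dx = conv.bp(np.ones(out.shape), lr=0.01)
    print(out.shape, dx.shape)  # (2, 6, 24, 24) (2, 1, 28, 28)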


def get_batchsize(batch_size, N):
    '''Shuffle the indices 0..N-1 and split them into batches; the list ends
    with a short (possibly empty) final batch.'''
    a = []
    b = list(range(N))
    random.shuffle(b)
    for i in range(N):
        l = b[i * batch_size:batch_size * (i + 1)]
        a.append(l)
        if len(l) < batch_size:
            break
    return a
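
# Example for get_batchsize (illustrative): batches of 3 over 10 shuffled
# indices give three full batches plus one of length 1; when batch_size
# divides N exactly, an empty trailing batch appears and train() skips it.
def _demo_get_batchsize():
    print(get_batchsize(3, 10))  # e.g. [[4, 0, 7], [2, 9, 5], [1, 8, 3], [6]]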


def train():
    N = 1000
    random_index = random.sample(range(train_data.shape[0]), N)
    train_x = train_data[random_index]
    train_y = train_labels[random_index]
    oneHot = np.identity(10)
    train_y = oneHot[train_y]
    train_x = train_x.reshape(N, 1, 28, 28) / 255

    conv1 = Conv(kernel_shape=(6, 1, 5, 5))  # N * 6 * 24 * 24
    relu1 = Relu()
    pool1 = Pooling()  # N * 6 * 12 *12

    conv2 = Conv(kernel_shape=(16, 6, 5, 5))  # N * 16 * 8 * 8
    relu2 = Relu()
    pool2 = Pooling()  # N * 16 * 4 * 4

    linear = Linear(256, 10)

    softmax = Softmax()
    epoch = 10
    batch_size = 10
    lr = 0.01
    for i in range(epoch):
        batch_random_index = get_batchsize(batch_size, N)
        for n, indexs in enumerate(batch_random_index):
            if len(indexs) == 0:
                break
            batch_x = train_x[indexs]
            batch_y = train_y[indexs]
            out = conv1.forward(batch_x)
            out = relu1.forward(out)
            out = pool1.forward(out)

            out = conv2.forward(out)
            out = relu2.forward(out)
            out = pool2.forward(out)

            out = out.reshape(batch_size, -1)

            out = linear.forward(out)
            loss, delta = softmax.forward(out, batch_y)

            delta = linear.bp(delta, lr)
            delta = delta.reshape((batch_size, 16, 4, 4))

            delta = pool2.bp(delta)
            delta = relu2.backward(delta)
            delta = conv2.bp(delta, lr)

            delta = pool1.bp(delta)
            delta = relu1.backward(delta)
            conv1.bp(delta, lr)

            print("Epoch-{}-{:05d}".format(str(i), n), ":", "loss:{:.4f}".format(loss))
        lr *= 0.95 ** (i + 1)  # exponential learning-rate decay (the factor compounds each epoch)
        np.savez("data.npz", k1=conv1.k, b1=conv1.b, k2=conv2.k, b2=conv2.b, w3=linear.W, b3=linear.b)  # save the parameters after every epoch


def test():
    r = np.load("data.npz")  # load the trained parameters
    N = 100
    random_index = random.sample(range(test_data.shape[0]), N)
    test_x = test_data[random_index]
    test_y = test_labels[random_index]
    # oneHot = np.identity(10)
    # test_y = oneHot[test_y]
    test_x = test_x.reshape(len(test_x), 1, 28, 28) / 255.  # normalize

    conv1 = Conv(kernel_shape=(6, 1, 5, 5))  # N * 6 * 24 * 24
    relu1 = Relu()
    pool1 = Pooling()  # N * 6 * 12 *12

    conv2 = Conv(kernel_shape=(16, 6, 5, 5))  # N * 16 * 8 * 8
    relu2 = Relu()
    pool2 = Pooling()  # N * 16 * 4 * 4

    nn = Linear(256, 10)
    softmax = Softmax()

    conv1.k = r["k1"]
    conv1.b = r["b1"]
    conv2.k = r["k2"]
    conv2.b = r["b2"]
    nn.W = r["w3"]
    nn.b = r["b3"]

    out = conv1.forward(test_x)
    out = relu1.forward(out)
    out = pool1.forward(out)
    out = conv2.forward(out)
    out = relu2.forward(out)
    out = pool2.forward(out)

    out = out.reshape(N, -1)

    out = nn.forward(out)
    num = 0
    for i in range(N):
        if np.argmax(out[i, :]) == test_y[i]:
            num += 1
    print("TEST-ACC: ", num / N * 100, "%")


train_data, train_labels, test_data, test_labels = load_data()
if __name__ == '__main__':
    # run train() once first to create data.npz; test() then loads it
    test()

Next up: an RNN.
