张量流自定义运算梯度

2024-04-14

我们想要在张量流中创建一个自定义层。因此，我们决定简单地从一个玩具示例开始：复制层。经过一番尝试和错误后，我们发现梯度似乎会传递正确的值。然而，在第二次迭代中，特征得到了 NAN。这可能是一个简单的错误，但目前我看不到它。

总的来说，我有两个问题：

有人可以发现这里的问题以及如何解决它吗？
调试张量流会话的好方法是什么？

复制操作.cc

#include "tensorflow/core/framework/op.h"
#include "tensorflow/core/framework/op_kernel.h"
#include <stdio.h>

namespace tensorflow {



typedef Eigen::ThreadPoolDevice CPUDevice;
typedef Eigen::GpuDevice GPUDevice;

template<typename Device, typename T>
class MyCopyOp: public OpKernel {
public:
    explicit MyCopyOp(OpKernelConstruction* context) :
            OpKernel(context) {
    }

    void Compute(OpKernelContext* context) override {
        const Tensor& input = context->input(0);
        auto in_flat = input.flat<T>();

        printf("Debug MyCopyOp Features: %s \n",input.DebugString().c_str());

        Tensor* output = nullptr;
        OP_REQUIRES_OK(context,
                context->allocate_output(0, input.shape(), &output));

        auto out_flat = output->flat<T>();
        out_flat.setZero();

        for (int d = 0; d < input.dims(); ++d) {
            for (int i = 0; i < input.dim_size(d); ++i) {
                out_flat(d * input.dim_size(d) + i) = in_flat(
                        d * input.dim_size(d) + i);
            }
        }

        printf("Debug MyCopyOp Output: %s \n",output->DebugString().c_str());
    }

};


template<typename Device, typename T>
class MyCopyGradOp: public OpKernel {
public:
    explicit MyCopyGradOp(OpKernelConstruction* context) :
            OpKernel(context) {

    }

    void Compute(OpKernelContext* context) override {
        printf("called MyCopyGradOp.Compute() \n");
        const Tensor& gradients = context->input(0);
        const Tensor& features = context->input(1);
        printf("Debug MyCopyOpGrad Gradients: %s \n",gradients.DebugString().c_str());
        printf("Debug MyCopyOpGrad Features: %s \n",features.DebugString().c_str());

        TensorShape output_shape = features.shape();

        Tensor* output = nullptr;
        OP_REQUIRES_OK(context,
                context->allocate_output(0, output_shape, &output));
        output->flat<T>().setZero();

        const T* btm_ptr = gradients.flat<T>().data();
        T* top_ptr = output->flat<T>().data();

        for (int i = 0; i < gradients.NumElements(); ++i) {
            top_ptr[i] = btm_ptr[i];
        }

        printf("Debug MyCopyOpGrad Output: %s \n",output->DebugString().c_str());
        printf("---------------------------------- \n");
    }

};


REGISTER_OP("MyCopy")
.Input("features: T")
.Output("output: T")
.Attr("T: realnumbertype")
.Doc(R"doc(
Copies all input values to the output
)doc");

REGISTER_OP("MyCopyGrad")
.Input("gradients: T")
.Input("features: T")
.Output("backprops: T")
.Attr("T: realnumbertype")
.Doc(R"doc(
TODO!!
)doc");


#define REGISTER_MYCOPY_KERNELS(type)                                           \
  REGISTER_KERNEL_BUILDER(                                                      \
      Name("MyCopy").Device(DEVICE_CPU).TypeConstraint<type>("T"),              \
      MyCopyOp<Eigen::ThreadPoolDevice, type>);                                 \
  REGISTER_KERNEL_BUILDER(                                                      \
      Name("MyCopyGrad").Device(DEVICE_CPU).TypeConstraint<type>("T"),          \
      MyCopyGradOp<Eigen::ThreadPoolDevice, type>);                             //  \
  // REGISTER_KERNEL_BUILDER(                                                      \
  //     Name("MyCopy").Device(DEVICE_GPU).TypeConstraint<type>("T"),              \
  //     MyCopyOp<Eigen::GpuDevice, type>);                                        \
  // REGISTER_KERNEL_BUILDER(                                                      \
  //     Name("MyCopyGrad").Device(DEVICE_GPU).TypeConstraint<type>("T"),          \
  //     MyCopyGradOp<Eigen::GpuDevice, type>);                                


REGISTER_MYCOPY_KERNELS(float); 
REGISTER_MYCOPY_KERNELS(int);
REGISTER_MYCOPY_KERNELS(double);


}

我们使用简单的 MNIST 示例作为基础：

层测试.py

from tensorflow.examples.tutorials.mnist import input_data
mnist = input_data.read_data_sets('MNIST_data', one_hot=True)

import tensorflow as tf
from tensorflow.python.framework import ops
copy_op_module = tf.load_op_library('copy_op.so')

@ops.RegisterGradient("MyCopy")
def _CopyOpGrad(op, grad):
  return copy_op_module.my_copy_grad(grad,op.inputs[0])

sess = tf.InteractiveSession()

x = tf.placeholder(tf.float32, shape=[None, 784])
y_ = tf.placeholder(tf.float32, shape=[None, 10])

W = tf.Variable(tf.zeros([784,10]))
b = tf.Variable(tf.zeros([10]))

sess.run(tf.initialize_all_variables())

y1 = tf.nn.softmax(tf.matmul(x,W) + b)
y = copy_op_module.my_copy(y1)            //Here: MyCopy Layer is inserted

cross_entropy = -tf.reduce_sum(y_*tf.log(y))

train_step = tf.train.GradientDescentOptimizer(0.01).minimize(cross_entropy)

for i in range(2):
  batch = mnist.train.next_batch(50)
  train_step.run(feed_dict={x: batch[0], y_: batch[1]})

correct_prediction = tf.equal(tf.argmax(y,1), tf.argmax(y_,1))
accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))
print(accuracy.eval(feed_dict={x: mnist.test.images, y_: mnist.test.labels}))

compile

TF_INC=$(python -c 'import tensorflow as tf; print(tf.sysconfig.get_include())')
TF_LIB=$(python -c 'import tensorflow as tf; print(tf.sysconfig.get_lib())')
g++ -std=c++11 -shared copy_op.cc -o copy_op.so -I $TF_INC -L $TF_LIB -fPIC -Wl,-rpath $TF_LIB

output:

Debug MyCopyOp Features: Tensor<type: float shape: [50,10] values: 0.1 0.1 0.1...> 
Debug MyCopyOp Output: Tensor<type: float shape: [50,10] values: 0.1 0.1 0.1...> 
called MyCopyGradOp.Compute() 
Debug MyCopyOpGrad Gradients: Tensor<type: float shape: [50,10] values: -0 -0 -0...> 
Debug MyCopyOpGrad Features: Tensor<type: float shape: [50,10] values: 0.1 0.1 0.1...> 
Debug MyCopyOpGrad Output: Tensor<type: float shape: [50,10] values: -0 -0 -0...> 
---------------------------------- 
Debug MyCopyOp Features: Tensor<type: float shape: [50,10] values: nan nan nan...> 
Debug MyCopyOp Output: Tensor<type: float shape: [50,10] values: nan nan nan...> 
called MyCopyGradOp.Compute() 
Debug MyCopyOpGrad Gradients: Tensor<type: float shape: [50,10] values: nan nan nan...> 
Debug MyCopyOpGrad Features: Tensor<type: float shape: [50,10] values: nan nan nan...> 
Debug MyCopyOpGrad Output: Tensor<type: float shape: [50,10] values: nan nan nan...> 
---------------------------------- 
Debug MyCopyOp Features: Tensor<type: float shape: [10000,10] values: nan nan nan...> 
Debug MyCopyOp Output: Tensor<type: float shape: [10000,10] values: nan nan nan...> 
0.098

预先非常感谢！

来自 mrry 的评论：使用 - 存在已知的稳定性问题tf.reduce_sum(y_ * tf.log(y))计算交叉熵（使用tf.nn.softmax_cross_entropy_with_logits(y, y_)相反），并初始化你的W变量为零通常会导致比随机初始化更糟糕的结果。这个答案 https://stackoverflow.com/questions/36127436/tensorflow-predicts-always-the-same-result/36134261#36134261有关权重初始化问题的更多详细信息。

本文内容由网友自发贡献，版权归原作者所有，本站不承担相应法律责任。如您发现有涉嫌抄袭侵权的内容，请联系:hwhale#tublm.com(使用前将#替换为@)

tensorflow

张量流自定义运算梯度的相关文章

可重用的 Tensorflow 卷积网络

我想重用来自Tensorflow 专业人士的 MNIST CNN 示例 http www tensorflow org tutorials mnist pros index md 我的图像尺寸为 388px X 191px 只有 2 个输出
从 keras 模型中将特征提取到数据集中

我使用以下代码由here https github com keras team keras blob master examples mnist cnn py 运行 CNN 来训练 MNIST 图像 from future import
Keras Maxpooling2d 层给出 ValueError

我正在尝试在 keras 中复制 VGG16 模型以下是我的代码 model Sequential model add ZeroPadding2D 1 1 input shape 3 224 224 model add Convoluti
Keras 中的 Tensorflow 自定义损失函数 - 张量循环

我正在尝试在 Keras 中编写自定义损失函数如下所示 Keras 中的自定义损失函数 https stackoverflow com questions 43818584 custom loss function in keras 我的
应定义密集层输入的最后一个维度。没有找到。收到完整的输入形状：<未知>

我在将模型从一些本地虚拟数据切换到使用 TF 数据集时遇到问题抱歉模型代码太长我已尝试尽可能缩短它以下工作正常 import tensorflow as tf import tensorflow recommenders as tfr
如何在 Windows 上的 Python 2.7 上安装 Tensorflow？

我尝试通过 pip 安装 TensorFlow pip install tensorflow 但是得到这个错误找不到满足tensorflow要求的版本来自版本这个问题有解决办法吗我还是想通过pip安装如果您只因为 Keras 而需
Tensorflow批处理：将结果保留为字符串

这个简单的程序 import tensorflow as tf input string batch tf train batch tf constant input batch size 1 with tf Session as sess
在 Chaquopy 中转换数组和张量

我该怎么做呢我看到你的帖子说你可以将 java 对象传递给 Python 方法但这不适用于 numpy 数组和 TensorFlow 张量以下以及其各种变体是我尝试过的但没有成功 double anchors new double
为什么 get_tensor_by_name 无法正确获取 tf.keras.layers 定义的层的权重

我尝试获取由以下定义的层的权重tf keras layers通过使用get tensor by name in tensorflow 代码如下 encoding utf 8 import tensorflow as tf x tf plac
访问 AWS 上的 Tensorboard

我正在尝试访问 AWS 上的 Tensorboard 这是我的设置张量板 tensorboard host 0 0 0 0 logdir train 在端口 6006 上启动 TensorBoard b 39 您可以导航到http 172
使用批量乘法的tensorflow的tensordot中的障碍

我正在张量流中实现 RBM 使用小批量实现参数更新存在障碍有2个张量第一个张量的形状是 100 3 1 第二个张量的形状是 100 1 4 数字 100 是批次大小所以我想将这些张量相乘得到 100 3 4 张量但是当我实现这样的
TensorFlow：在输入处获取梯度时性能缓慢

我正在使用 TensorFlow 构建一个简单的多层感知器并且我还需要获取神经网络输入损失的梯度或误差信号这是我的代码它有效 cost tf reduce mean tf nn softmax cross entropy with
Keras 通过设置种子获得不同的结果[重复]

这个问题在这里已经有答案了在keras中每次运行都有很高的方差和不稳定的性能为了解决这个问题根据https keras io getting started faq how can i obtain reproducible res
如何在Google机器学习中将jpeg图像转换为json文件

我正在研究 Google Cloud ML 我想对 jpeg 图像进行预测为此我想使用 gcloud beta ml 预测 instances INSTANCES model MODEL version VERSION https cl
错误：tensorflow：无法匹配检查点的文件

我正在训练一个张量流模型在每个时期之后我都会保存模型状态并腌制一些数组到目前为止我的模型执行了 2 个纪元并且保存状态的文件夹包含以下文件 checkpoint model e knihy preprocessed txt e0 c
没有带有张量板的图表

我正在读一本关于 Tensorflow 的书我发现了这段代码 from future import absolute import from future import division from future import print
Keras ImageDataGenerator 相当于 csv 文件

我在文件夹中排序了一堆数据如下图所示我需要构建一个 DataIterator 以便将数据放入神经网络模型中当数据是图像时我找到了很多例子来解决这个问题使用 Keras 类图像数据生成器及其方法流自目录但当数据是 csv 结构时则
Keras ZeroDivisionError：整数除法或以零为模

我正在尝试使用 Keras 和 Tensorflow 实现卷积神经网络我有以下代码 from keras models import Sequential from keras layers import Conv2D MaxPoolin
在 Keras 上使用回调 Tensorboard 时出现 AttributeError：“Model”对象没有属性“run_eagerly”

我已经使用 Keras 的功能 API 构建了一个模型当我将 Tensorboard 实例添加到 model fit 函数的回调中时它会抛出一个错误 AttributeError Model object has no attribut
PIL.Image.open和tf.image.decode_jpeg返回值的区别

我使用 PIL Image open 和 tf image decode jpeg 将图像文件解析为数组但发现PIL Image open 中的像素值与tf image decode jpeg不一样为什么会出现这种情况 Thanks 代

随机推荐

姜戈。复杂的注释需要别名。这里的别名是什么？

我试图通过以下查询获取模型的最大值和最小值 max min price MyModel objects annotate Min price Max price 但我收到错误复杂的注释需要别名我不确定别名在这里意味着什么并且我认为文档
测试助手类的正确位置在哪里？（phpunit/最佳实践）

我想使用 PHPUnit 测试我的应用程序所以我像往常一样有我的应用程序类和第二棵带有测试类的树现在我需要进行一些测试一种虚拟模拟对象我想知道应该将它们放在哪里它是一个不同的用例它应该放在公共 lib 文件夹中还是更喜欢什么
如何使用 FirefoxProfile 在 FireFox Selenium Webdriver 中启用 Adobe Flash

我需要一种自动化方法来在 Firefox Selenium Webdriver 中启用 Flash 而无需用户交互我努力了 FirefoxProfile profile new FirefoxProfile As 0 is to disa
Azure 移动应用自定义身份验证

我正在尝试使用来实现自定义身份验证LoginAsync string provider JObject token MobileServiceClient 的重载我有一个像这样的自定义身份验证控制器 MobileAppController
如何检查事件是否已存在一天 - fullcalendar

如何在使用时检查事件是否已经存在一天renderEvent method 我发现可能在堆栈中回答dayClick with clientEvents 我不确定它如何用于renderEvent var diffDay 5 for var i
如何选择博客模型中的最后一个和倒数第二个条目？

我有一个模型 blog posts 其中有一个字段 published at 我想从该模型中选择最新的两个博客以显示在我的主页上但不确定如何构建它目前我有一个解决方法可以获取一部分数据但当我表中没有任何内容时它会不断失败而不是
ARM架构中不同处理器模式下如何使用内核堆栈？

据我了解每个进程都有一个用户堆栈和内核堆栈除此之外 ARM 架构中的每种模式都有一个堆栈所以我想知道不同的堆栈和堆栈指针在 ARM 模式下如何工作另外何时会使用与进程关联的内核堆栈何时会使用与进程关联的内核堆栈当您进行系统调用
Python 中枚举的枚举？

Python 中是否可以有枚举的枚举例如我想要 enumA enumB elementA elementB enumC elementC elementD 供我参考elementA as enumA enumB elementA 或参考
设置 GLEW 窗口？

我有 Visual Studio 2010 我想在其上设置 glew h 我执行了这一步但仍然出现链接器错误 1 下载glew包 2 将 h文件复制到C Program Files x86 Microsoft SDKs Windows v
Parsley.js - 更改错误容器

我想改变每个错误消息的位置即在相应的位置显示错误消息 div class errorBlock div 通过使用文档代码错误消息显示在元素输入之前而不是按预期显示有任何想法吗根据文档 errors container func
Knex 连接 Heroku Postgres 时出现错误？

我正在尝试将 Heroku Postgres 与 Knex 连接它在本地运行良好但是当我推 Heroku 时并尝试注册一个帐户我收到这个错误 code DEPTH ZERO SELF SIGNED CERT 但我推 Heroku 我
Windows 服务错误 1053

我目前正在编写一个 Windows 服务它连接到 crm 系统以拉下一个计划然后运行各种数据源等我已经一切正常除了当我安装所有内容并尝试运行启动服务时我收到以下错误错误 1053 服务未响应启动或控制请求及时时尚这是我在 S
在 JavaScript 中，await 是否可以保证执行顺序而不需要赋值？

主题我可以说下面的两段代码是相等的吗 await someFunc no assignment here doSomethingAfterSomeFunc and someFunc then gt doSomethingAfterSome
如何在android http POST中添加参数？

friends 我正在尝试使用以下教程将文件上传到 php 服务器http getablogger blogspot com 2008 01 android how to post file to php server html http
添加带有多个小部件链接的右键单击上下文菜单？

我的问题是一种后续行动这个问题 https stackoverflow com questions 12014210 python tkinter app adding a right click context menu 23834156
如何使用标准 MVC Core 依赖注入解析未注册类型

有没有办法得到IServiceProvider GetService
如何在 matplotlib 中的另一个图上添加一个图？

我有两个包含数据的文件 datafile1 和 datafile2 第一个始终存在第二个仅有时存在因此 datafile2 上的数据图被定义为我的 python 脚本中的函数 geom macro 在 datafile1 上的数据绘制代
Visual Studio 忽略 try catch - 仅调试

我认为错误处理是个好主意调试时它可能会妨碍特别是对于用户友好的消息在 VB6 中我只需选中编译器的一个框即可忽略我的错误处理我found https stackoverflow com questions 893277 is th
Mediator/EventAggregator 差异

另外当我需要在松散耦合的对象之间进行通信时例如 MVVM的 ViewModel 有关最佳编程实践的不同书籍和博客建议使用 Mediator EventAggregator 模式我的问题是关于这些模式之间的差异关系谁能为我描述一下它
张量流自定义运算梯度

我们想要在张量流中创建一个自定义层因此我们决定简单地从一个玩具示例开始复制层经过一番尝试和错误后我们发现梯度似乎会传递正确的值然而在第二次迭代中特征得到了 NAN 这可能是一个简单的错误但目前我看不到它总的来说我有两个

张量流自定义运算梯度

张量流自定义运算梯度 的相关文章

随机推荐

热门标签

张量流自定义运算梯度的相关文章