Tensorflow 汇总合并错误：形状 [-1,784] 具有负尺寸

2023-11-26

我试图总结下面神经网络的训练过程。

import tensorflow as tf 
import numpy as np 

from tensorflow.examples.tutorials.mnist import input_data

# Load MNIST with one-hot encoded labels from the local "MNIST" directory.
# A raw string is used because "\M" is not a valid escape sequence; the path
# bytes are unchanged.
mnist = input_data.read_data_sets(r".\MNIST", one_hot=True)

# Create the model
def train_and_test(hidden1, hidden2, learning_rate, epochs, batch_size):
    """Train a two-hidden-layer MNIST classifier and write TensorBoard summaries.

    The network (784 -> hidden1 -> hidden2 -> 10) is added to the current
    default graph, trained with plain gradient descent on softmax
    cross-entropy, and its merged summaries are written to "./data".

    NOTE: all ops and summaries are registered in the process-wide default
    graph, and tf.summary.merge_all() merges every summary collected there.
    If this function is called more than once in the same interpreter (for
    example by re-running the script in an IDE console), the merged op also
    depends on placeholders created by earlier calls, which are never fed.
    Call tf.reset_default_graph() before re-running in that situation.

    Args:
        hidden1: Number of units in the first hidden layer.
        hidden2: Number of units in the second hidden layer.
        learning_rate: Learning rate passed to GradientDescentOptimizer.
        epochs: Number of training steps; each step consumes one mini-batch.
        batch_size: Examples per mini-batch. It is also the fixed leading
            dimension of both placeholders, so every fed batch must have
            exactly this many rows.

    Returns:
        Accuracy on the most recently evaluated test batch, or None when
        ``epochs`` is 0 and no evaluation ever ran.
    """
    with tf.name_scope("first_layer"):
        input_data = tf.placeholder(tf.float32, [batch_size, 784], name="input")
        weights1 = tf.Variable(
            tf.random_normal(shape=[784, hidden1], stddev=0.1), name="weights")
        bias = tf.Variable(tf.constant(0.0, shape=[hidden1]), name="bias")
        activation = tf.nn.relu(
            tf.matmul(input_data, weights1) + bias, name="relu_act")
        tf.summary.histogram("first_activation", activation)

    with tf.name_scope("second_layer"):
        weights2 = tf.Variable(
            tf.random_normal(shape=[hidden1, hidden2], stddev=0.1),
            name="weights")
        bias2 = tf.Variable(tf.constant(0.0, shape=[hidden2]), name="bias")
        activation2 = tf.nn.relu(
            tf.matmul(activation, weights2) + bias2, name="relu_act")
        tf.summary.histogram("second_activation", activation2)

    with tf.name_scope("output_layer"):
        weights3 = tf.Variable(
            tf.random_normal(shape=[hidden2, 10], stddev=0.5), name="weights")
        bias3 = tf.Variable(tf.constant(1.0, shape=[10]), name="bias")
        # Raw logits; softmax is applied inside the loss op below.
        output = tf.add(
            tf.matmul(activation2, weights3, name="mul"), bias3, name="output")
        tf.summary.histogram("output_activation", output)
    y_ = tf.placeholder(tf.float32, [batch_size, 10])

    with tf.name_scope("loss"):
        cross_entropy = tf.reduce_mean(
            tf.nn.softmax_cross_entropy_with_logits(labels=y_, logits=output))
        tf.summary.scalar("cross_entropy", cross_entropy)
    with tf.name_scope("train"):
        train_step = tf.train.GradientDescentOptimizer(learning_rate).minimize(cross_entropy)

    with tf.name_scope("tests"):
        correct_prediction = tf.equal(tf.argmax(output, 1), tf.argmax(y_, 1))
        accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

    summary_op = tf.summary.merge_all()

    sess = tf.InteractiveSession()
    writer = tf.summary.FileWriter("./data", sess.graph)
    # Defined up front so the return below is valid even when epochs == 0.
    test_accuracy = None
    try:
        # Relies on the InteractiveSession having installed itself as default.
        tf.global_variables_initializer().run()

        # Train
        for i in range(epochs):
            batch_xs, batch_ys = mnist.train.next_batch(batch_size)
            _, summary = sess.run([train_step, summary_op], feed_dict={input_data: batch_xs, y_: batch_ys})
            # Record the step so TensorBoard plots a curve over time.
            writer.add_summary(summary, global_step=i)

            if i % 10 == 0:
                # Evaluate on held-out data rather than on the training split.
                test_xs, test_ys = mnist.test.next_batch(batch_size)
                test_accuracy = sess.run(accuracy, feed_dict={input_data: test_xs, y_: test_ys})
    finally:
        # Flush the event file and release the session even if a step fails.
        writer.close()
        sess.close()
    return test_accuracy

if __name__ == "__main__":
    # Arguments: hidden1=500, hidden2=200, learning_rate=0.001,
    # epochs=10000, batch_size=100.
    print(train_and_test(500, 200, 0.001, 10000, 100))

每隔 10 步，我会用一批随机测试数据来测试模型。问题出在 summary writer 上：for 循环内的 sess.run() 抛出了以下错误。

    Traceback (most recent call last):

  File "<ipython-input-18-78c88c8e6471>", line 1, in <module>
    runfile('C:/Users/Suman 
Nepal/Documents/Projects/MNISTtensorflow/mnist.py', wdir='C:/Users/Suman 
Nepal/Documents/Projects/MNISTtensorflow')

  File "C:\Users\Suman Nepal\Anaconda3\lib\site-
packages\spyder\utils\site\sitecustomize.py", line 880, in runfile
execfile(filename, namespace)

  File "C:\Users\Suman Nepal\Anaconda3\lib\site-
packages\spyder\utils\site\sitecustomize.py", line 102, in execfile
exec(compile(f.read(), filename, 'exec'), namespace)

  File "C:/Users/Suman Nepal/Documents/Projects/MNISTtensorflow/mnist.py", line 68, in <module>
    print(train_and_test(500, 200, 0.001, 100, 100))

  File "C:/Users/Suman Nepal/Documents/Projects/MNISTtensorflow/mnist.py", line 58, in train_and_test
    _, summary = sess.run([train_step,summary_op], feed_dict={input_data: batch_xs, y_: batch_ys})

  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tensorflow\python\client\session.py", line 789, in run
    run_metadata_ptr)

  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tensorflow\python\client\session.py", line 997, in _run
feed_dict_string, options, run_metadata)

  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tensorflow\python\client\session.py", line 1132, in _do_run
target_list, options, run_metadata)

  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tensorflow\python\client\session.py", line 1152, in _do_call
raise type(e)(node_def, op, message)

InvalidArgumentError: Shape [-1,784] has negative dimensions
 [[Node: first_layer_5/input = Placeholder[dtype=DT_FLOAT, shape=[?,784], _device="/job:localhost/replica:0/task:0/cpu:0"]()]]

Caused by op 'first_layer_5/input', defined at:
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\spyder\utils\ipython\start_kernel.py", line 231, in <module>
main()
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\spyder\utils\ipython\start_kernel.py", line 227, in main
kernel.start()
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\ipykernel\kernelapp.py", line 477, in start
ioloop.IOLoop.instance().start()
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\zmq\eventloop\ioloop.py", line 177, in start
super(ZMQIOLoop, self).start()
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tornado\ioloop.py", line 888, in start
handler_func(fd_obj, events)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tornado\stack_context.py", line 277, in null_wrapper
return fn(*args, **kwargs)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\zmq\eventloop\zmqstream.py", line 440, in _handle_events
self._handle_recv()
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\zmq\eventloop\zmqstream.py", line 472, in _handle_recv
self._run_callback(callback, msg)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\zmq\eventloop\zmqstream.py", line 414, in _run_callback
callback(*args, **kwargs)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tornado\stack_context.py", line 277, in null_wrapper
return fn(*args, **kwargs)
 File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\ipykernel\kernelbase.py", line 283, in dispatcher
return self.dispatch_shell(stream, msg)
 File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\ipykernel\kernelbase.py", line 235, in dispatch_shell
handler(stream, idents, msg)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\ipykernel\kernelbase.py", line 399, in execute_request
user_expressions, allow_stdin)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\ipykernel\ipkernel.py", line 196, in do_execute
res = shell.run_cell(code, store_history=store_history, silent=silent)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\ipykernel\zmqshell.py", line 533, in run_cell
return super(ZMQInteractiveShell, self).run_cell(*args, **kwargs)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\IPython\core\interactiveshell.py", line 2717, in run_cell
interactivity=interactivity, compiler=compiler, result=result)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\IPython\core\interactiveshell.py", line 2827, in run_ast_nodes
if self.run_code(code, result):
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\IPython\core\interactiveshell.py", line 2881, in run_code
exec(code_obj, self.user_global_ns, self.user_ns)
  File "<ipython-input-8-78c88c8e6471>", line 1, in <module>
runfile('C:/Users/Suman Nepal/Documents/Projects/MNISTtensorflow/mnist.py', wdir='C:/Users/Suman Nepal/Documents/Projects/MNISTtensorflow')
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\spyder\utils\site\sitecustomize.py", line 880, in runfile
execfile(filename, namespace)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\spyder\utils\site\sitecustomize.py", line 102, in execfile
exec(compile(f.read(), filename, 'exec'), namespace)
  File "C:/Users/Suman Nepal/Documents/Projects/MNISTtensorflow/mnist.py", line 86, in <module>
  File "C:/Users/Suman Nepal/Documents/Projects/MNISTtensorflow/mnist.py", line 12, in train_and_test
   input_data = tf.placeholder(tf.float32, [None, 784], name = "input")
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tensorflow\python\ops\array_ops.py", line 1530, in placeholder
return gen_array_ops._placeholder(dtype=dtype, shape=shape, name=name)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tensorflow\python\ops\gen_array_ops.py", line 1954, in _placeholder
name=name)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tensorflow\python\framework\op_def_library.py", line 767, in apply_op
op_def=op_def)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tensorflow\python\framework\ops.py", line 2506, in create_op
original_op=self._default_original_op, op_def=op_def)
  File "C:\Users\Suman Nepal\Anaconda3\lib\site-packages\tensorflow\python\framework\ops.py", line 1269, in __init__
self._traceback = _extract_stack()

InvalidArgumentError (see above for traceback): Shape [-1,784] has negative dimensions
     [[Node: first_layer_5/input = Placeholder[dtype=DT_FLOAT, shape=[?,784], _device="/job:localhost/replica:0/task:0/cpu:0"]()]]

如果我删除所有的 summary writer 和 summary 操作，模型就能正常运行。你能帮我找出这里的问题吗？我尝试过调整张量的形状，但一无所获。

以下是原提问者在一个已删除的答案中留下的评论：

我实际上是在 with tf.Graph() as g 下构建神经网络的。我删除了交互式会话，改用 with tf.Session(g) as sess 来启动会话。这样问题就解决了。

这样一来，图 g 并没有被标记为默认图，因此会话（原始代码中的 tf.InteractiveSession）会转而使用另一个图。

顺便一提，我是因为遇到了相同的错误消息才找到这里的。就我而言，我无意中写出了类似下面的代码：

# Illustrative snippet of the mistake described in the surrounding text.
input_data = tf.placeholder(tf.float32, shape=(None, 50))
# Rebinding the name: input_data now refers to the tanh output tensor,
# and the placeholder created above is no longer reachable by this name.
input_data = tf.tanh(input_data)
# The feed_dict key is therefore the tanh tensor, so the placeholder itself
# is never fed.
session.run(..., feed_dict={input_data: ...})

也就是说，我并没有给占位符喂入数据。这种情况下，其他一些张量运算似乎就会引发这个令人困惑的错误，因为未定义的维度在内部表示为 -1。

本文内容由网友自发贡献，版权归原作者所有，本站不承担相应法律责任。如您发现有涉嫌抄袭侵权的内容，请联系:hwhale#tublm.com(使用前将#替换为@)

tensorflow

tensorboard

Tensorflow 汇总合并错误：形状 [-1,784] 具有负尺寸的相关文章

Tensorflow 数据 API - 预取

我正在尝试使用 TF 的新功能即 Data API 但我不知道如何使用prefetch作品在下面的代码中 def dataset input fn dataset tf data TFRecordDataset filenames co
如何使用 TFlearn 中的 ImageAugmentation 训练 CNN 中的图像和数据混合

我想使用图像像素信息和数据的混合在 Tflearn Tensorflow 中训练卷积神经网络由于我的图像数量较少因此我需要使用图像增强来增加传递到网络的图像样本数量但这意味着我只能传递图像数据作为输入数据必须在稍后阶段大概在全
TensorFlow.js 调整 3D 张量大小

我有一个具有以下尺寸的 3D 张量宽度 x 高度 x 深度我需要将可变大小的体积调整为特定形状例如 256 x 256 x 256 不幸的是在 TensorFlow js 中他们有一组用于调整大小的方法例如tf image re
如何使用 keras.backend.gradients() 获取梯度值

我试图获得 Keras 模型的输出相对于模型输入 x 而不是权重的导数似乎最简单的方法是使用 keras backend 中的梯度它返回梯度张量 https keras io backend https keras io backe
TensorFlow CUDA_ERROR_OUT_OF_MEMORY

我正在尝试在 TensorFlow 中构建一个大型 CNN 并打算在多 GPU 系统上运行它我采用了塔式系统并为两个 GPU 拆分批次同时将变量和其他计算保留在 CPU 上我的系统有 32GB 内存但是当我运行代码时出现错误
TensorFlow 中的 global_step 是什么意思？

在这就是教程代码 https github com tensorflow tensorflow blob master tensorflow examples tutorials mnist mnist py来自 TensorFlow 网站
跨多个 GPU/机器的 TF-Slim 的配置/标志

我很好奇是否有关于如何使用部署 model deploy py 在多台机器上的多个 GPU 上运行 TF Slim models slim 的示例该文档非常好但我缺少一些内容具体来说需要为worker device和ps devic
使用输入管道时如何替换 feed_dict？

假设您有一个已与feed dict到目前为止将数据注入到图表中每隔几个时期我就会通过将任一数据集的一批数据输入到我的图表中来评估训练和测试损失现在出于性能原因我决定使用输入管道看看这个虚拟示例 import tensorflow
Tensorflow推荐的系统规格？

我开始在我的 RHEL 6 5 机器上安装 Tensorflow 但事实证明 Tensorflow 需要 glibc gt 2 17 而 rhel 6 5 上默认的 glibc 是 2 12 我想知道是否有人可以帮助我了解张量流的最低推荐
如何使用 Tensorflow 中的 Hugging Face Transformers 库对自定义数据进行文本分类？

我正在尝试使用 Hugging Face Transformers 库提供的不同变压器架构对自定义数据 csv 格式进行二进制文本分类我正在用这个张量流博客文章 https blog tensorflow org 2019 11 hug
Tensorboard 和 Dropout 层

我有一个非常基本的查询我制作了 4 个几乎相同差异在于输入形状的 CNN 并在连接到全连接层的前馈网络时合并了它们几乎相同的 CNN 的代码 model3 Sequential model3 add Convolution2D 32
AttributeError：模块“keras.engine”没有属性“Layer”

当我试图运行时Parking Slot mask rcnn py文件我收到如下错误mrcnn model py文件我该如何解决 gt 2021 06 17 08 25 18 585897 W tensorflow stream execut
通过 cmake 使用预编译的张量流

我已经建立了一个 C 项目CLion使用CMake 我正在使用各种第三方库并且还想集成张量流我试过了bazel编译张量流到共享库libtensorflow so哪种工作有效但是仍然有相当多的依赖项例如当前的 protobuf 版本
Tensorflow如何生成不平衡组合数据集

我对新数据集 API tensorflow 1 4 有疑问我有两个数据集我需要创建一个组合的不平衡数据集即每个批次应包含第一个数据集中一定数量的元素和第二个数据集中一定数量的元素例如 dataset1 tf data Datase
从字符串列表创建 TfRecords 并在解码后在张量流中提供图形

目的是创建 TfRecords 数据库给定我有 23 个文件夹每个文件夹包含 7500 个图像以及 23 个文本文件每个文件有 7500 行描述单独文件夹中 7500 个图像的特征我通过以下代码创建了数据库 import ten
有没有办法在bigquery中使用kmeans、tensorflow保存的模型？

我知道这有点愚蠢因为 BigQueryML 现在为 Kmeans 提供了良好的初始化尽管如此我还是需要在张量流中训练一个模型然后将其传递给 BigQuery 进行预测我保存了模型一切正常直到我尝试将其上传到 bigquery
无需安装 Tensorflow 即可服务 Tensorflow 模型

我有一个经过训练的模型想在 python 应用程序中使用但我看不到任何在不安装 TensorFlow 或创建 gRPC 服务的情况下部署到生产环境的示例有可能吗在这种情况下正确的做法是什么如果不使用 TensorFlow 本身或
Tensorboard——High-level节点的计算时间与其子节点计算时间的总和不同

继tutorial https www tensorflow org programmers guide graph viz在 TensorFlow 上我试图使用张量板来理解运行时统计数据我发现代表名称范围的高级节点的计算时间不等于其子
交换keras中的张量轴

我想将图像批次的张量轴从 batch size row col ch 交换为批次大小通道行列在 numpy 中这可以通过以下方式完成 X batch np moveaxis X batch 3 1 我该如何在 Keras 中做到
对输入求 Keras 模型的导数返回全零

所以我有一个 Keras 模型我想将模型的梯度应用于其输入这就是我所做的 import tensorflow as tf from keras models import Sequential from keras layers imp

随机推荐

页面刷新和多个选项卡上的 Vuex 状态

在我的应用程序中我使用 firebase API 进行用户身份验证我将登录状态保存为 vuex 状态中的布尔值当用户登录时我将登录状态设置为 true 并使用此功能隐藏顶部菜单上的登录按钮并显示注销按钮当用户注销时反之亦然所以我
为什么注释会生成重复条目？

给出以下代码 payments Payment objects filter customer self customer created at gte kwargs start date created at lte kwargs end
cpp 中未排序数组上的 lower_bound 的行为

我想问 cpp C 中的 lower bound 当应用于未排序的数组时表现如何我的意思是当我运行以下程序时 include
跨域Ajax调用找不到元素位置：moz-nullprincipal

我正在尝试通过 jquery 调用来调用跨域 Web 服务 ajax 服务返回
jQuery UI Sortable - 确定哪个元素位于被拖动的元素下方[关闭]

Closed 这个问题不符合堆栈溢出指南目前不接受答案我在一个简单的无序列表上实现了 jQuery UI 的 Sortable 插件有没有办法确定哪个元素在被拖动的元素下面在这个截图中Row 3 column 1正在盘旋Row 2
找不到 com.google.android.gms:播放服务:3.1.59 3.2.25 4.0.30 4.1.32 4.2.40 4.2.42 4.3.23 4.4.52 5.0.77 5.0.89 5.2.08 6.1。 11 71.6.1 87.6

通过 gradle 引用 play services 对我来说停止了工作把它归结为甚至我首先用作参考的示例也停止工作 https plus google com AndroidDevelopers posts 4Yhpn6p9icf F
远程触发Maven发布

我想从 Java 程序以编程方式启动 Maven 发布这个网页展示了一般是如何完成的这就是我所做的 final URL url new URL http jenkins job MyProject m2release submit fi
温莎城堡：使用约定注册以及具体实现

假设我们有由 Foo 实现的 IFoo 以及由 FirstBar 和 SecondBar 实现的 IBar 使用此约定注册 container Register AllTypes FromThisAssembly Pick WithServ
如何创建具有对角（或有角度）顶线的 div

我是 CSS3 的新手我所知道的都是自学阅读你们或任何其他教程所以经过几个小时的研究和试错我真的需要你们的帮助我正在尝试仅旋转 div 的顶线这就是我到目前为止所做的 http blanc design com sigma2 在
Resteasy 和 Google Guice：如何通过 @Injection 使用多个 @ApplicationPath 和资源？

I 创建了一个项目使用 Resteasy 在我的 Jax rs 资源中测试 Google Guice 提供的依赖项注入我的意图是使用多个 ApplicationPath对于我的 API 的版本在每个类中注释为 ApplicationP
使用正则表达式查找回文

这个问题是为了试图理解以下答案之一如何使用正则表达式检查字符串是否为回文给出的答案马库斯贾德罗 is 1 2 有人可以解释一下这里到底发生了什么我需要做类似的事情Perl 但无法理解这个解决方案 PS 我对 Perl 不太擅长所
GCC不支持简单整数常量表达式？

海湾合作委员会 4 9 和 5 1reject这个简单的全局范围的 C99 声明铿锵接受了 const int a 1 b a error initializer element is not constant 这么基本的功能怎么可能少呢
使用 Google 日历的 Android 应用程序 - 同步问题

我正在尝试创建一个与 Google 日历交互的 Android 应用程序我已按照使用内容提供程序的教程进行操作here 解释了此代码的部分内容here 我面临以下问题我创建了一个新日历测试日历从我的笔记本电脑上在线获取并将其标记为Se
将 fgets() 与 char* 类型一起使用

我有一个关于将 fgets 与 char 字符串一起使用的简单问题 char temp FILE fp fopen test txt r fgets temp 500 fp printf s temp 这段代码运行得不好但我修改后char
Composer View 未将变量加载到视图中

我之前创建了 3 个作曲家视图它们都工作正常但后来我创建了另一个但似乎不起作用我一直在努力让它工作它似乎与我的代码无关我将把其中的一部分放在这里但我仍然不认为这是代码提供者 EvenComposerProvider publ
文件系统 API 在 Chrome v27 和 v29 中不起作用

我正在尝试设置文件存储以供稍后在 Phonegap 中使用但现在在 Chrome 中进行调试按照描述的方式进行html5rocks只允许我向用户请求配额但请求文件系统时的回调不会执行看 window webkitStorageInf
如何从 GUI 应用程序正确终止 QThread？

我尝试使用self terminate 在 QThread 类中还有self thread terminate 在 GUI 类中我也尝试过放self wait 在这两种情况下但是会发生两种情况 1 线程根本没有终止 GUI 冻结等待
何时使用 scala 三重插入符 (^^^) 与双插入符 (^^) 和 into 方法 (>>)

有人可以解释在设计 scala 解析器组合器时如何以及何时使用三重插入符与双插入符吗以及何时如何使用 parser into 方法 gt gt 我将从一个使用 Scala 的示例开始Option类型在一些重要方面类似于Parser
BeanUtils 不适用于链设置器

e g class tester Test public void testBeanUtils throws InvocationTargetException IllegalAccessException NoSuchMethodExce
Tensorflow 汇总合并错误：形状 [-1,784] 具有负尺寸

我试图总结下面神经网络的训练过程 import tensorflow as tf import numpy as np from tensorflow examples tutorials mnist import input data m

Tensorflow 汇总合并错误：形状 [-1,784] 具有负尺寸

Tensorflow 汇总合并错误：形状 [-1,784] 具有负尺寸 的相关文章

随机推荐

热门标签

Tensorflow 汇总合并错误：形状 [-1,784] 具有负尺寸的相关文章