请大神指点，VGG-16训练时权重不更新，怎么回事？？

用tensorflow训练VGG-16时，权重不发生变化是怎么回事？？

 import tensorflow as tf
import scipy.io as sio 
#import numpy as np
import matplotlib.image as mpimg
import pickle as cp
a = list(sio.loadmat('dataset/corel5k_train_annot.mat')['annot1'])
b = list(sio.loadmat('dataset/corel5k_test_annot.mat')['annot2'])
def get_batch(image, label, batch_size, now_batch, total_batch):

    if now_batch < total_batch-1:
        image_batch = image[now_batch*batch_size:(now_batch+1)*batch_size]
        label_batch = label[now_batch*batch_size:(now_batch+1)*batch_size]
    else:
        image_batch = image[now_batch*batch_size:]
        label_batch 


= label[now_batch*batch_size:]
    #image_batch = tf.reshape(image_batch,[-1,128,128,3])

    return  image_batch,label_batch

train_img = []
with open('image/corel5k_train_list.txt') as f:
    for i in f.readlines():
        train_img += [mpimg.imread('image/%s.jpg'%i.strip())]
    cp.dump(train_img,open("train.pkl","wb"))
test_img = []
with open('image/corel5k_test_list.txt') as f:
    for i in f.readlines():
        test_img += [mpimg.imread('image/%s.jpg'%i.strip())]
    cp.dump(test_img,open("test.pkl","wb"))#一种保存列表的方式

x = tf.placeholder(tf.float32,[None,128,128,3])
y_ = tf.placeholder(tf.float32, shape=[None, 260])
#loss=tf.Variable(tf.constant(0.0))
#第一
W1 = tf.Variable(tf.truncated_normal([3, 3, 3, 64], mean=0.0,stddev=1.0))
b1 = tf.Variable(tf.constant(0.0, shape=[64]))
h1 =  tf.nn.relu(tf.nn.conv2d(x, W1, strides=[1, 1, 1, 1], padding='SAME') + b1)
#p1 = tf.nn.max_pool(h1, ksize=[1, 2, 2, 1],strides=[1, 2, 2, 1], padding='SAME')

W2 = tf.Variable(tf.truncated_normal([3, 3, 64, 64], mean=0.0,stddev=1.0))
b2 = tf.Variable(tf.constant(0.0, shape=[64]))
h2 = tf.nn.relu(tf.nn.conv2d(h1, W2, strides=[1, 1, 1, 1], padding='SAME') + b2)
p2 = tf.nn.max_pool(h2, ksize=[1, 2, 2, 1],strides=[1, 2, 2, 1], padding='SAME')
#第二
W3 = tf.Variable(tf.truncated_normal([3, 3, 64, 128], mean=0.0,stddev=1.0))
b3 = tf.Variable(tf.constant(0.0, shape=[128]))
h3 = tf.nn.relu(tf.nn.conv2d(p2, W3, strides=[1, 1, 1, 1], padding='SAME') + b3)
#p3 = tf.nn.max_pool(h2, ksize=[1, 2, 2, 1],strides=[1, 2, 2, 1], padding='SAME')

W4 = tf.Variable(tf.truncated_normal([3, 3, 128, 128], mean=0.0,stddev=1.0))
b4 = tf.Variable(tf.constant(0.0, shape=[128]))
h4 = tf.nn.relu(tf.nn.conv2d(h3, W4, strides=[1, 1, 1, 1], padding='SAME') + b4)
p4 = tf.nn.max_pool(h4, ksize=[1, 2, 2, 1],strides=[1, 2, 2, 1], padding='SAME')
#第三
W5 = tf.Variable(tf.truncated_normal([3, 3, 128, 256], mean=0.0,stddev=1.0))
b5 = tf.Variable(tf.constant(0.0, shape=[256]))
h5 = tf.nn.relu(tf.nn.conv2d(p4, W5, strides=[1, 1, 1, 1], padding='SAME') + b5)

W6 = tf.Variable(tf.truncated_normal([3, 3, 256, 256], mean=0.0,stddev=1.0))
b6 = tf.Variable(tf.constant(0.0, shape=[256]))
h6 = tf.nn.relu(tf.nn.conv2d(h5, W6, strides=[1, 1, 1, 1], padding='SAME') + b6)

W7 = tf.Variable(tf.truncated_normal([3, 3, 256, 256], mean=0.0,stddev=1.0))
b7 = tf.Variable(tf.constant(0.0, shape=[256]))
h7 = tf.nn.relu(tf.nn.conv2d(h6, W7, strides=[1, 1, 1, 1], padding='SAME') + b7)
p7 = tf.nn.max_pool(h7, ksize=[1, 2, 2, 1],strides=[1, 2, 2, 1], padding='SAME')

#第四
W8 = tf.Variable(tf.truncated_normal([3, 3, 256, 512], mean=0.0,stddev=1.0))
b8 = tf.Variable(tf.constant(0.0, shape=[512]))
h8 = tf.nn.relu(tf.nn.conv2d(p7, W8, strides=[1, 1, 1, 1], padding='SAME') + b8)

W9 = tf.Variable(tf.truncated_normal([3, 3, 512, 512], mean=0.0,stddev=1.0))
b9 = tf.Variable(tf.constant(0.0, shape=[512]))
h9 = tf.nn.relu(tf.nn.conv2d(h8, W9, strides=[1, 1, 1, 1], padding='SAME') + b9)

W10 = tf.Variable(tf.truncated_normal([3, 3, 512, 512], mean=0.0,stddev=1.0))
b10 = tf.Variable(tf.constant(0.0, shape=[512]))
h10 = tf.nn.relu(tf.nn.conv2d(h9, W10, strides=[1, 1, 1, 1], padding='SAME') + b10)
p10 = tf.nn.max_pool(h10, ksize=[1, 2, 2, 1],strides=[1, 2, 2, 1], padding='SAME')

#第五
W11 = tf.Variable(tf.truncated_normal([3, 3, 512, 512], mean=0.0,stddev=1.0))
b11 = tf.Variable(tf.constant(0.0, shape=[512]))
h11 = tf.nn.relu(tf.nn.conv2d(p10, W11, strides=[1, 1, 1, 1], padding='SAME') + b11)

W12 = tf.Variable(tf.truncated_normal([3, 3, 512, 512], mean=0.0,stddev=1.0))
b12 = tf.Variable(tf.constant(0.0, shape=[512]))
h12 = tf.nn.relu(tf.nn.conv2d(h11, W12, strides=[1, 1, 1, 1], padding='SAME') + b12)

W13 = tf.Variable(tf.truncated_normal([3, 3, 512, 512], mean=0.0,stddev=1.0))
b13 = tf.Variable(tf.constant(0.0, shape=[512]))
h13 = tf.nn.relu(tf.nn.conv2d(h12, W13, strides=[1, 1, 1, 1], padding='SAME') + b13)
p13 = tf.nn.max_pool(h13, ksize=[1, 2, 2, 1],strides=[1, 2, 2, 1], padding='SAME')

W_fc1 = tf.Variable(tf.truncated_normal([4*4*512, 4096], mean=0.0,stddev=1.0))
b_fc1 = tf.Variable(tf.constant(0.0, shape=[4096]))
h_pool2_flat = tf.reshape(p13, [-1, 4*4*512])
h_fc1 = tf.nn.relu(tf.matmul(h_pool2_flat, W_fc1) + b_fc1)

keep_prob1 = tf.placeholder(tf.float32)
h_fc1_drop = tf.nn.dropout(h_fc1, keep_prob1)

W_fc2 = tf.Variable(tf.truncated_normal([4096, 4096], mean=0.0,stddev=1.0))
b_fc2 = tf.Variable(tf.constant(0.0, shape=[4096]))
h_fc2 = tf.nn.relu(tf.matmul(h_fc1_drop, W_fc2) + b_fc2)

keep_prob2 = tf.placeholder(tf.float32)
h_fc2_drop = tf.nn.dropout(h_fc2, keep_prob2)

W_fc3 = tf.Variable(tf.truncated_normal([4096, 260], mean=0.0,stddev=1.0))
b_fc3 = tf.Variable(tf.constant(0.0, shape=[260]))
y_conv=tf.nn.softmax(tf.matmul(h_fc2_drop, W_fc3) + b_fc3)


loss = tf.reduce_mean(-tf.reduce_sum(y_*tf.log(y_conv + 1e-10), reduction_indices=[1]))

train_step = tf.train.AdamOptimizer(0.1).minimize(loss)



with tf.Session() as sess:
    sess.run(tf.global_variables_initializer())
    for v in range(100):
        for r in range(90):
            image_batch,label_batch = get_batch(train_img,a,50,r,90)
            sess.run(train_step,feed_dict={x:image_batch,y_:label_batch,keep_prob1: 0.5,keep_prob2: 0.5})
        print(sess.run(W_fc3))


    print("*")
    test_batch,testlabel_batch = get_batch(test_img,b,50,0,2)
    print(sess.run(loss,feed_dict={x:test_batch,y_:testlabel_batch,keep_prob1: 1,keep_prob2: 1}))

写回答
好问题 0 提建议
追加酬金
关注问题
分享
邀请回答
编辑收藏删除结题
收藏举报

1条回答默认最新

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
zqbnqsdsmd 2018-11-15 11:53
关注
https://blog.csdn.net/l627515523/article/details/80166534

解决无用
评论打赏
分享
举报

评论

按下Enter换行，Ctrl+Enter发表内容

报告相同问题？

关注问题

【深度学习】使用自己写的VGG16网络训练精度不提升 pytorch 深度学习神经网络
2022-05-30 00:00

回答 2 已采纳删除最后的softmax层，在内个relu之前加归一化就好了
torchvision中预训练的VGG16和一般论文里的VGG-VD-16有什么区别 pytorch 图像处理深度学习
2023-04-06 16:16

回答 1 已采纳 VGG16 和 VGG-VD-16 在网络结构上是有区别的。VGG16 是 VGG 网络的一种实现，而 VGG-VD-16 则是 VGG 网络的一种变体。 PyTorch 中的 torchvision
vgg19训练图像分类，分成两类，这样训练出来的网络是否过拟合了？人工智能机器学习深度学习
2021-03-23 15:58

回答 3 已采纳 1k5左右就差不多了，过拟合的话不一定，要看下有没有防止过拟合的手段，如果你的项目是开源项目的话，一般会有这方面的限制的。
人工智能_预训练_VGGNet16_图像识别模型预训练权重_可重调
2022-02-13 23:58

人工智能_预训练_VGGNet16_图像识别模型预训练权重_可重调
为什么在pytorch中使用VGG16不用预训练，自己从头训练猫狗分类，正确率只有74%就上不去了？ pytorch 深度学习神经网络
2021-10-21 23:53

回答 1 已采纳官方pretrain的模型数据集是imagenet，样本数是你这个数据集的很多倍，这样的vgg网络卷积层的参数基本收敛到比较好的一个情况，你直接用来finetune只要稍微微调一下最后的fc层就可以得
Vgg16模型分析图片输出的向量维度可以改变吗？机器学习深度学习自然语言处理
2023-03-18 02:20

回答 5 已采纳参考GPT和自己的思路： Vgg16模型是一个预训练的深度卷积神经网络，它由若干个卷积层和池化层构成。在输入一张图片后，模型会输出一个特征向量，该向量的维度通常为1000，用来表示该图片的分类信息。这
如何在VGG网络中加入金字塔结构？ pytorch 神经网络
2021-09-01 15:43

回答 1 已采纳 VGG网络加FPN（金子塔结构）实现起来不难，首先看一下VGG的实现：简介VggNet与其pytorch实现_清华和你，要上一个的博客-CSDN博客_pytorch vggnet 目前正在学
vgg-cifar100:在CIFAR-100上训练的VGG-16的Tensorflow实现
2021-05-17 09:33

CIFAR-100上的VGG-16 在CIFAR-100上训练的VGG网（具有batchnorm和dropout）。您可以通过更改数据加载器类中的一行来轻松修改此代码以在CIFAR-10上进行训练。在不增加数据的情况下达到约64％的准确性。该数据集上...
keras训练二分类模型acc一直0.5 loss一直是0.69怎么办? tensorflow 人工智能深度学习
2021-03-18 16:11

回答 2 已采纳帮你改了下代码，路径你自己再改改，验证集acc能跑到0.8以上了。 import os import tensorflow as tf from tensorflow.keras import S
vgg16每次跑出的结果都相同 tensorflow 深度学习神经网络
2022-04-01 02:02

回答 1 已采纳可以调整参数，多运行几次（cpu跟gpu不影响结果，只是gpu运行快一点）
ModuleNotFoundError: No module named 'vgg'明明有VGG，还出现这个错误 python pytorch 神经网络
2021-08-31 20:17

回答 2 已采纳 ?你import了么
TensorFlow VGG-16 预训练模型-vgg_16.ckpt
2019-02-01 11:54

TensorFlow VGG-16 预训练模型，用于SSD-TensorFlow的Demo训练.
tensorflow预训练模型input格式错误 python tensorflow 人工智能
2023-02-03 11:52

回答 4 已采纳后续增加numpy解决
把vgg-face.mat权重迁移到pytorch模型示例
2020-09-18 05:23

今天小编就为大家分享一篇把vgg-face.mat权重迁移到pytorch模型示例，具有很好的参考价值，希望对大家有所帮助。一起跟随小编过来看看吧
人工智能-项目实践-信息检索-基于VGG-16的图像检索系统
2024-02-29 09:57

基于VGG-16的图像检索系统选取图像特征传统的检索通常采用颜色、形状、纹理、能量等，我们使用深度学习模型（vgg16, resnet50,densenet121）进行特征提取。为了简便，直接用Keras的预训练模型索引化数据集对...
没有解决我的问题, 去提问

悬赏问题

¥15 vue3+express部署到nginx
¥20 搭建pt1000三线制高精度测温电路
¥15 使用Jdk8自带的算法，和Jdk11自带的加密结果会一样吗，不一样的话有什么解决方案，Jdk不能升级的情况
¥15 画两个图 python或R
¥15 在线请求openmv与pixhawk 实现实时目标跟踪的具体通讯方法
¥15 八路抢答器设计出现故障
¥15 opencv 无法读取视频
¥15 按键修改电子时钟，C51单片机
¥60 Java中实现如何实现张量类，并用于图像处理(不运用其他科学计算库和图像处理库）)
¥20 5037端口被adb自己占了

请大神指点，VGG-16训练时权重不更新，怎么回事？？

1条回答 默认 最新

悬赏问题

1条回答默认最新