import tensorflow as tf
import readtxt2 as read
import datetime
import numpy as np
import os
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
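
# Bi-directional LSTM text classifier with an additive attention layer.
# The script builds the graph (PbAttention), trains it in run_epoch(), and
# exports a SavedModel / GraphDef for serving (e.g. called from Java).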
class Config(object):
    # number of target classes
    numClasses = 3
    # maximum sentence length
    maxSeqLength = 64
    # word-embedding dimensionality
    numDimensions = 200
    KEEP_PROB = 0.1        # dropout rate, i.e. the fraction of units dropped (despite the name)
    HIDDEN_SIZE = 64       # number of hidden units per LSTM layer
    NUM_LAYERS = 1         # number of LSTM layers
    VOCAB_SIZE = 10000     # vocabulary size
    LEARNING_RATE = 0.002  # learning rate
    TRAIN_BATCH_SIZE = 64  # training batch size
    grad_clip = 4.0        # gradient-clipping threshold
    # at evaluation time the batch size is set to 1
    EVAL_BATCH_SIZE = 1
    EVAL_NUM_STEP = 1
    attention_size = 64    # size of the attention layer
class PbAttention(object):
def __init__(self, config, is_training, word_vectors):
self.config = config
self.batch_size = tf.compat.v1.placeholder(tf.int32, name='batch_size')
        # one-hot target classes
        self.input_class = tf.compat.v1.placeholder(tf.int32, [None, self.config.numClasses], name="input_class")
        # input text as padded word ids
        self.input_line = tf.compat.v1.placeholder(tf.int32, [None, self.config.maxSeqLength], name="input_line")
self.is_training = is_training
self.global_step = tf.Variable(0, trainable=False, name='global_step')
        self.sequence_lengths = tf.compat.v1.placeholder(tf.int32, shape=[None], name="sequence_lengths")
        # [vocabulary size, embedding dimension], initialized from the pretrained word vectors
        self.embedding = tf.compat.v1.get_variable(
            "embedding", shape=[len(word_vectors), self.config.numDimensions],
            initializer=tf.compat.v1.constant_initializer(word_vectors))
self.rnn(self.is_training)
tensor_info_x = tf.saved_model.utils.build_tensor_info(self.input_line)
tensor_info_y = tf.saved_model.utils.build_tensor_info(self.y_pred_cls)
self.tensor_info_x = tensor_info_x
self.tensor_info_y = tensor_info_y
logdir = "tensorboard/" + datetime.datetime.now().strftime("%Y%m%d-%H%M%S") + "/"
self.logdir = logdir
merged = tf.summary.merge_all()
self.merged = merged
def rnn(self, is_training):
# Define Basic RNN Cell
def basic_rnn_cell(rnn_size):
# return tf.contrib.rnn.GRUCell(rnn_size)
return tf.contrib.rnn.LSTMCell(rnn_size, state_is_tuple=True)
# Define Forward RNN Cell
with tf.name_scope('fw_rnn'):
fw_rnn_cell = tf.contrib.rnn.MultiRNNCell([basic_rnn_cell(self.config.HIDDEN_SIZE) for _ in range(self.config.NUM_LAYERS)])
if is_training:
                # KEEP_PROB holds the dropout *rate*, so the keep probability is 1 - rate
                fw_rnn_cell = tf.contrib.rnn.DropoutWrapper(fw_rnn_cell, output_keep_prob=1.0 - self.config.KEEP_PROB)
# Define Backward RNN Cell
with tf.name_scope('bw_rnn'):
bw_rnn_cell = tf.contrib.rnn.MultiRNNCell([basic_rnn_cell(self.config.HIDDEN_SIZE) for _ in range(self.config.NUM_LAYERS)])
if is_training:
                bw_rnn_cell = tf.contrib.rnn.DropoutWrapper(bw_rnn_cell, output_keep_prob=1.0 - self.config.KEEP_PROB)
# Embedding layer
with tf.name_scope('embedding_line'):
input_line_vec = tf.nn.embedding_lookup(self.embedding, self.input_line)
tf.summary.histogram("input_line_vec", input_line_vec)
        with tf.name_scope('bi_rnn'):
            rnn_output, _ = tf.nn.bidirectional_dynamic_rnn(fw_rnn_cell, bw_rnn_cell, inputs=input_line_vec,
                                                            sequence_length=self.sequence_lengths, dtype=tf.float32)
            # bidirectional_dynamic_rnn returns a (forward, backward) tuple;
            # concatenate the two along the feature axis before summarizing
            if isinstance(rnn_output, tuple):
                rnn_output = tf.concat(rnn_output, 2)
            tf.summary.histogram("rnn_output", rnn_output)
# Attention Layer
with tf.name_scope('attention'):
            input_shape = rnn_output.shape  # (batch_size, sequence_length, 2 * HIDDEN_SIZE)
            sequence_size = input_shape.as_list()[1]  # number of time steps processed by the RNN
            hidden_size = input_shape.as_list()[2]    # concatenated forward + backward hidden size
attention_w = tf.Variable(tf.truncated_normal([hidden_size, self.config.attention_size], stddev=0.1),
name='attention_w')
attention_b = tf.Variable(tf.constant(0.1, shape=[self.config.attention_size]), name='attention_b')
attention_u = tf.Variable(tf.truncated_normal([self.config.attention_size], stddev=0.1), name='attention_u')
            # tf.summary.histogram("attention_w", attention_w)
z_list = []
for t in range(sequence_size):
u_t = tf.tanh(tf.matmul(rnn_output[:, t, :], attention_w) + tf.reshape(attention_b, [1, -1]))
z_t = tf.matmul(u_t, tf.reshape(attention_u, [-1, 1]))
z_list.append(z_t)
            # concatenate the per-step scores into shape (batch_size, sequence_size)
attention_z = tf.concat(z_list, axis=1)
self.alpha = tf.nn.softmax(attention_z)
attention_output = tf.reduce_sum(rnn_output * tf.reshape(self.alpha, [-1, sequence_size, 1]), 1)
tf.summary.histogram("alpha", self.alpha)
tf.summary.histogram("attention_output", attention_output)
# attention_output shape: (batch_size, hidden_size)
        # Add dropout (applied only during training)
        with tf.name_scope('dropout'):
            # attention_output shape: (batch_size, hidden_size)
            if is_training:
                self.final_output = tf.nn.dropout(attention_output, rate=self.config.KEEP_PROB)
            else:
                self.final_output = attention_output
            tf.summary.histogram("final_output", self.final_output)
# Fully connected layer
with tf.name_scope('output'):
fc_w = tf.Variable(tf.truncated_normal([hidden_size, self.config.numClasses], stddev=0.1), name='fc_w')
fc_b = tf.Variable(tf.zeros([self.config.numClasses]), name='fc_b')
# 目标向量
self.logits = tf.matmul(self.final_output, fc_w) + fc_b
self.y_pred_cls = tf.argmax(self.logits, 1, name='predictions')
tf.summary.histogram("fc_w", fc_w)
tf.summary.histogram("fc_b", fc_b)
tf.summary.histogram("logits", self.logits)
tf.summary.histogram("y_pred_cls", self.y_pred_cls)
# Calculate cross-entropy loss
with tf.name_scope('loss'):
            cross_entropy = tf.nn.softmax_cross_entropy_with_logits_v2(
                logits=self.logits, labels=tf.cast(self.input_class, tf.float32))
self.loss = tf.reduce_mean(cross_entropy)
tf.summary.scalar("loss", self.loss)
# Create optimizer
with tf.name_scope('optimization'):
optimizer = tf.train.AdamOptimizer(self.config.LEARNING_RATE)
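            # clip_by_global_norm rescales each gradient g_i by
            # grad_clip / max(||g||_2, grad_clip), so one noisy batch cannot
            # blow up the recurrent weights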
gradients, variables = zip(*optimizer.compute_gradients(self.loss))
gradients, _ = tf.clip_by_global_norm(gradients, self.config.grad_clip)
self.optim = optimizer.apply_gradients(zip(gradients, variables), global_step=self.global_step)
# Calculate accuracy
with tf.name_scope('accuracy'):
correct_pred = tf.equal(self.y_pred_cls, tf.argmax(self.input_class, 1))
self.acc = tf.reduce_mean(tf.cast(correct_pred, tf.float32))
tf.summary.scalar("accuracy", self.acc)
def get_sequence_length(x_batch):
    """
    Args:
        x_batch: a batch of padded word-id sequences
    Returns:
        sequence_lengths: a list with the actual (unpadded) length of every
            sequence in the batch, assuming the padding id is 0
    """
    sequence_lengths = []
    for x in x_batch:
        actual_length = np.sum(np.sign(x))  # count the non-zero (non-padding) ids
        sequence_lengths.append(actual_length)
    return sequence_lengths
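
# Example with a hypothetical batch (padding id 0):
#   get_sequence_length(np.array([[4, 7, 2, 0, 0],
#                                 [9, 0, 0, 0, 0]]))  # -> [3, 1]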
def run_epoch(session, model, data, target, eval_data, eval_target):
writer = tf.summary.FileWriter(model.logdir, session.graph)
saver = tf.train.Saver()
    # state = session.run(model.initial_state)  # initial LSTM cell state
    batch_size = 128
    # run up to `steps` mini-batches, cycling over the training data
    steps = 5000
dataset_size = len(target)
dataset_size = (dataset_size // batch_size) * batch_size
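    # e.g. with 10,000 labelled examples and batch_size 128:
    # dataset_size = (10000 // 128) * 128 = 9984, so the last 16 examples are dropped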
eval_dataset_size = len(eval_target)
eval_dataset_size = (eval_dataset_size // batch_size) * batch_size
for step in range(steps):
        # take the next batch_size samples for this training step
start = (step * batch_size) % dataset_size
end = min(start + batch_size, dataset_size)
x_batch = data[start:end]
sequence_lengths = get_sequence_length(x_batch)
        _batch_size1 = end - start  # actual number of samples in this slice
        _, summary, accuracy = session.run([model.optim, model.merged, model.acc],
{model.input_line: x_batch, model.input_class: target[start:end],
model.sequence_lengths: sequence_lengths,
model.batch_size: _batch_size1
})
if step % 10 == 0:
            writer.add_summary(summary, step)
if step % 20 == 0:
print("step: %d accuracy: %g time: %s" % (step, accuracy, datetime.datetime.now().strftime("%Y%m%d-%H%M%S")))
        # Evaluate on the held-out set every 100 training steps
        if step % 100 == 0 and step != 0:
eval_step = step // 100
eval_start = (eval_step * 1000) % eval_dataset_size
eval_end = min(eval_start + 1000, eval_dataset_size)
eval_batch = eval_data[eval_start:eval_end]
eval_batch_class = eval_target[eval_start:eval_end]
eval_sequence_lengths = get_sequence_length(eval_batch)
            _batch_size = eval_end - eval_start  # actual number of eval samples
            # evaluation only: run the metrics, not the optimizer, on held-out data
            summary, accuracy = session.run([model.merged, model.acc],
{model.input_line: eval_batch,
model.input_class: eval_batch_class,
model.sequence_lengths: eval_sequence_lengths,
model.batch_size: _batch_size
})
print("eval step: %d accuracy: %g time: %s" % (step, accuracy, datetime.datetime.now().strftime("%Y%m%d-%H%M%S")))
if accuracy > 0.92 and step > 1000:
break
save_path = saver.save(session, "pretrained_lstm.ckpt", global_step=step)
print("saved to %s" % save_path)
writer.close()
def main():
g_2 = tf.Graph()
with g_2.as_default():
words_list, word_vectors, words_list_map = read._read_word2vec("gbn-word2vector.txt")
print("----------------------------------bg-1------------------------------")
        targets, words = read._read_train_data("padata-1.txt")
print("----------------------------------bg-2------------------------------")
config = Config()
datax = read._train_uniondata_index(words, config.maxSeqLength, words_list_map)
print("----------------------------------bg-------------------------------")
eval_targets, eval_words = read._read_train_data("padatapre-1.txt")
eval_datax = read._train_uniondata_index(eval_words, config.maxSeqLength, words_list_map)
print("----------------------------------bg-veal-------------------------------")
initializer = tf.random_uniform_initializer(-0.05, 0.05)
with tf.compat.v1.variable_scope("language_model", reuse=None, initializer=initializer):
train_model = PbAttention(config, True, word_vectors)
with tf.Session(graph=g_2) as session:
tf.global_variables_initializer().run()
for i in range(1):
print("In iteration: %d" % (i + 1))
run_epoch(session, train_model, datax, targets, eval_datax, eval_targets)
train_model.is_training = False
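            # NOTE: flipping is_training here does not rebuild the graph, so the
            # dropout ops created in rnn() remain in the exported model; exporting
            # a dropout-free graph would require building a second PbAttention
            # with is_training=False and the trained weights restored into it.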
prediction_signature = tf.saved_model.signature_def_utils.build_signature_def(
inputs={'input-x': train_model.tensor_info_x},
outputs={'out-y':train_model.tensor_info_y})
legacy_init_op = tf.group(tf.tables_initializer(), name='legacy_init_op')
            # save the trained model as a SavedModel so it can be called from Java
builder = tf.saved_model.builder.SavedModelBuilder("model/pb/"
+ datetime.datetime.now().strftime("%Y%m%d-%H%M%S"))
builder.add_meta_graph_and_variables(
session, [tf.saved_model.tag_constants.SERVING],
signature_def_map={
'predict_data': prediction_signature},
legacy_init_op=legacy_init_op)
builder.save(False)
graph_def = g_2.as_graph_def()
tf.train.write_graph(graph_def, "models/pb1/" + datetime.datetime.now().strftime("%Y%m%d-%H%M%S"), 'expert-graph.pb', as_text=False)
tf.train.write_graph(graph_def, "models/pb1/" + datetime.datetime.now().strftime("%Y%m%d-%H%M%S"), 'expert-graph2.pb', as_text=True)
if __name__ == "__main__":
main()