2.4scope

name_scope

variable_scope

scope (name_scope/variable_scope)

from __future__ import print_function

import tensorflow as tf

with tf.name_scope("a_name_scope"):

    initializer = tf.constant_initializer(value=1)

    var1 = tf.get_variable(name='var1', shape=[1], dtype=tf.float32, initializer=initializer)

    var2 = tf.Variable(name='var2', initial_value=[2], dtype=tf.float32)

    var21 = tf.Variable(name='var2', initial_value=[2.1], dtype=tf.float32)

    var22 = tf.Variable(name='var2', initial_value=[2.2], dtype=tf.float32)

with tf.Session() as sess:

    sess.run(tf.initialize_all_variables())

    print(var1.name)        # var1:0 此种get_variable对于name_scope无效

    print(sess.run(var1))   # [ 1.]

    print(var2.name)        # a_name_scope/var2:0

    print(sess.run(var2))   # [ 2.]

    print(var21.name)       # a_name_scope/var2_1:0

    print(sess.run(var21))  # [ 2.0999999]

    print(var22.name)       # a_name_scope/var2_2:0

    print(sess.run(var22))  # [ 2.20000005]

with tf.variable_scope("a_variable_scope") as scope:

    initializer = tf.constant_initializer(value=3)

    var3 = tf.get_variable(name='var3', shape=[1], dtype=tf.float32, initializer=initializer)

    var4 = tf.Variable(name='var4', initial_value=[4], dtype=tf.float32)

    var4_reuse = tf.Variable(name='var4', initial_value=[4], dtype=tf.float32)

    scope.reuse_variables()  #定义了可重复利用

    var3_reuse = tf.get_variable(name='var3',)

with tf.Session() as sess:

    # tf.initialize_all_variables() no long valid from

    # 2017-03-02 if using tensorflow >= 0.12

    if int((tf.__version__).split('.')[1]) < 12 and int((tf.__version__).split('.')[0]) < 1:

        init = tf.initialize_all_variables()

    else:

        init = tf.global_variables_initializer()

    sess.run(init)

    print(var3.name)            # a_variable_scope/var3:0

    print(sess.run(var3))       # [ 3.]

    print(var4.name)            # a_variable_scope/var4:0

    print(sess.run(var4))       # [ 4.]

    print(var4_reuse.name)      # a_variable_scope/var4_1:0

    print(sess.run(var4_reuse)) # [ 4.]

    print(var3_reuse.name)      # a_variable_scope/var3:0

    print(sess.run(var3_reuse)) # [ 3.]

通常在RNN中有一个重复循环机制，比如在training中和test中的结构是不同的，但是在两者的参数是相同的时候，就可以用到

scope.reuse_variables()

# visit https://morvanzhou.github.io/tutorials/ for more!

# 22 scope (name_scope/variable_scope)

from __future__ import print_function

import tensorflow as tf

class TrainConfig:

    batch_size = 20

    time_steps = 20

    input_size = 10

    output_size = 2

    cell_size = 11

    learning_rate = 0.01

class TestConfig(TrainConfig):

    time_steps = 1

class RNN(object):

    def __init__(self, config):

        self._batch_size = config.batch_size

        self._time_steps = config.time_steps

        self._input_size = config.input_size

        self._output_size = config.output_size

        self._cell_size = config.cell_size

        self._lr = config.learning_rate

        self._built_RNN()

    def _built_RNN(self):

        with tf.variable_scope('inputs'):

            self._xs = tf.placeholder(tf.float32, [self._batch_size, self._time_steps, self._input_size], name='xs')

            self._ys = tf.placeholder(tf.float32, [self._batch_size, self._time_steps, self._output_size], name='ys')

        with tf.name_scope('RNN'):

            with tf.variable_scope('input_layer'):

                l_in_x = tf.reshape(self._xs, [-1, self._input_size], name='2_2D')  # (batch*n_step, in_size)

                # Ws (in_size, cell_size)

                Wi = self._weight_variable([self._input_size, self._cell_size])

                print(Wi.name)

                # bs (cell_size, )

                bi = self._bias_variable([self._cell_size, ])

                # l_in_y = (batch * n_steps, cell_size)

                with tf.name_scope('Wx_plus_b'):

                    l_in_y = tf.matmul(l_in_x, Wi) + bi

                l_in_y = tf.reshape(l_in_y, [-1, self._time_steps, self._cell_size], name='2_3D')

            with tf.variable_scope('cell'):

                cell = tf.contrib.rnn.BasicLSTMCell(self._cell_size)

                with tf.name_scope('initial_state'):

                    self._cell_initial_state = cell.zero_state(self._batch_size, dtype=tf.float32)

                self.cell_outputs = []

                cell_state = self._cell_initial_state

                for t in range(self._time_steps):

                    if t > 0: tf.get_variable_scope().reuse_variables()

                    cell_output, cell_state = cell(l_in_y[:, t, :], cell_state)

                    self.cell_outputs.append(cell_output)

                self._cell_final_state = cell_state

            with tf.variable_scope('output_layer'):

                # cell_outputs_reshaped (BATCH*TIME_STEP, CELL_SIZE)

                cell_outputs_reshaped = tf.reshape(tf.concat(1, self.cell_outputs), [-1, self._cell_size])

                Wo = self._weight_variable((self._cell_size, self._output_size))

                bo = self._bias_variable((self._output_size,))

                product = tf.matmul(cell_outputs_reshaped, Wo) + bo

                # _pred shape (batch*time_step, output_size)

                self._pred = tf.nn.relu(product)    # for displacement

        with tf.name_scope('cost'):

            _pred = tf.reshape(self._pred, [self._batch_size, self._time_steps, self._output_size])

            mse = self.ms_error(_pred, self._ys)

            mse_ave_across_batch = tf.reduce_mean(mse, 0)

            mse_sum_across_time = tf.reduce_sum(mse_ave_across_batch, 0)

            self._cost = mse_sum_across_time

            self._cost_ave_time = self._cost / self._time_steps

        with tf.name_scope('trian'):

            self._lr = tf.convert_to_tensor(self._lr)

            self.train_op = tf.train.AdamOptimizer(self._lr).minimize(self._cost)

    @staticmethod

    def ms_error(y_pre, y_target):

        return tf.square(tf.sub(y_pre, y_target))

    @staticmethod

    def _weight_variable(shape, name='weights'):

        initializer = tf.random_normal_initializer(mean=0., stddev=0.5, )

        return tf.get_variable(shape=shape, initializer=initializer, name=name)

    @staticmethod

    def _bias_variable(shape, name='biases'):

        initializer = tf.constant_initializer(0.1)

        return tf.get_variable(name=name, shape=shape, initializer=initializer)

if __name__ == '__main__':

    train_config = TrainConfig()

    test_config = TestConfig()

    # the wrong method to reuse parameters in train rnn

    with tf.variable_scope('train_rnn'):

        train_rnn1 = RNN(train_config)  #参数在train和test都是一致的

    with tf.variable_scope('test_rnn'):

        test_rnn1 = RNN(test_config)    #参数在train和test都是一致的

# the right method to reuse parameters in train rnn
　　with tf.variable_scope('rnn') as scope:
　　　　sess = tf.Session()
　　　　train_rnn2 = RNN(train_config)
　　　　scope.reuse_variables()
　　　　test_rnn2 = RNN(test_config)
　　　　# tf.initialize_all_variables() no long valid from
　　　　# 2017-03-02 if using tensorflow >= 0.12
　　　　if int((tf.__version__).split('.')[1]) < 12 and int((tf.__version__).split('.')[0]) < 1:
　　　　　　init = tf.initialize_all_variables()
　　　　else:
　　　　　　init = tf.global_variables_initializer()
　　　　sess.run(init)

2.4scope的更多相关文章

随机推荐

VMWare------启动虚拟机时出现“start booting fron CD... Error loading image:DFEAULT.EZB”提示
提示详情: start booting fron CD... Error loading image:DFEAULT.EZB 解决方法: iso镜像文件有问题,需要下载正确的镜像文件 MSDN下载地址 ...
UVA 1232 - SKYLINE(线段树)
UVA 1232 - SKYLINE option=com_onlinejudge&Itemid=8&page=show_problem&category=502&pr ...
今天被坑了，而且被坑的好爽！该死的UTF-8 有 BOM 格式编码
调一个项目,最后无法登录了. 排查到最后发现是cookie无法保存会话ID, 工作两年的经验这时候没用上. 开始一以为是PHP.ini的配置错了. 考虑过域名,浏览器问题. 脚本BUG. 最后最后一步 ...
thinkjs+swagger Editor
一直很好奇专门写接口同事的工作,于是趁着手边工作中的闲暇时间,特地看看神奇的接口文档怎么摆弄. 总览: 这是基于thinkjs(3.0),使用swagger editor编写,实现功能性测试的接口文档 ...
js 中的break continue return
break:跳出整个循环 1.当i=6时,就跳出了整个循环,此for循环就不继续了: continue:跳出当前循环,继续下一次循环: return :指定函数返回值 1.在js当中,常使用retur ...
mysql check约束无效
转自http://blog.csdn.net/maxint64/article/details/8643288 今天在mysql中尝试使用check约束时,才知道在MySQL中CHECK约束是无效的, ...
(转载)JVM实现synchronized的底层机制
目前在Java中存在两种锁机制:synchronized和Lock,Lock接口及其实现类是JDK5增加的内容,其作者是大名鼎鼎的并发专家Doug Lea.本文并不比较synchronized与Loc ...
Bypassing PatchGuard on Windows x64
[说明] 1. 本文是意译,加之本人英文水平有限.windows底层技术属菜鸟级别,本文与原文存在一定误差,请多包涵. 2. 由于内容较多,从word拷贝过来排版就乱了.故你也可以下载附件. 3. ...
页面调用Iframe中数据
<iframe src="html的路径(至于MVC中cshtml直接路径好像是不行的,得使用action进行请求出来的路径)" id="iframechild&q ...
Android中Adapter总结
根据一个制作列表的程序开始练手,结果就出现了学习安卓的第一个代码问题运行程序发现,虽然报错,但是可以成功运行程序. Android中Adapter功能为显示ListView,最常用的有ArrayA ...

2.4scope

name_scope

variable_scope

2.4scope的更多相关文章

随机推荐

热门专题