
StyleGAN Source Code Walkthrough: network.py (Part 2)

styleGAN—network.py

Source code

Below is the last part of the run method of the Network class in network.py.

class Network:
    def run(self,
            *in_arrays: Tuple[Union[np.ndarray, None], ...],
            input_transform: dict = None,
            output_transform: dict = None,
            return_as_list: bool = False,
            print_progress: bool = False,
            minibatch_size: int = None,
            num_gpus: int = 1,
            assume_frozen: bool = False,
            **dynamic_kwargs) -> Union[np.ndarray, Tuple[np.ndarray, ...], List[np.ndarray]]:

        assert len(in_arrays) == self.num_inputs
        assert not all(arr is None for arr in in_arrays)
        assert input_transform is None or util.is_top_level_function(input_transform["func"])
        assert output_transform is None or util.is_top_level_function(output_transform["func"])
        output_transform, dynamic_kwargs = _handle_legacy_output_transforms(output_transform, dynamic_kwargs)
        num_items = in_arrays[0].shape[0]
        if minibatch_size is None:
            minibatch_size = num_items

        # Construct unique hash key from all arguments that affect the TensorFlow graph.
        # ... (omitted in this excerpt)

        # Build graph.
        # ... (omitted in this excerpt)

        # Run minibatches.
        in_expr, out_expr = self._run_cache[key]
        out_arrays = [np.empty([num_items] + tfutil.shape_to_list(expr.shape)[1:], expr.dtype.name) for expr in out_expr]

        for mb_begin in range(0, num_items, minibatch_size):
            if print_progress:
                print("\r%d / %d" % (mb_begin, num_items), end="")

            mb_end = min(mb_begin + minibatch_size, num_items)
            mb_num = mb_end - mb_begin
            mb_in = [src[mb_begin : mb_end] if src is not None else np.zeros([mb_num] + shape[1:]) for src, shape in zip(in_arrays, self.input_shapes)]
            mb_out = tf.get_default_session().run(out_expr, dict(zip(in_expr, mb_in)))

            for dst, src in zip(out_arrays, mb_out):
                dst[mb_begin : mb_end] = src

        # Done.
        if print_progress:
            print("\r%d / %d" % (num_items, num_items))

        if not return_as_list:
            out_arrays = out_arrays[0] if len(out_arrays) == 1 else tuple(out_arrays)
        return out_arrays

## Helper function (located in dnnlib/tflib)
def shape_to_list(shape: Iterable[tf.Dimension]) -> List[Union[int, None]]:
    """Convert a TensorFlow shape into a Python list."""
    return [dim.value for dim in shape]

Run minibatches

in_expr and out_expr are both lists. Because out_arrays is allocated with out_expr as the template, its (only) element has shape [1, 1024, 1024, 3]:

# Output observed when running pretrained.py
>>> print(in_expr)
[<tf.Tensor 'Gs/_Run/latents_in:0' shape=<unknown> dtype=float32>, <tf.Tensor 'Gs/_Run/labels_in:0' shape=<unknown> dtype=float32>]
>>> print(out_expr)
[<tf.Tensor 'Gs/_Run/concat:0' shape=(?, 1024, 1024, 3) dtype=uint8>]
>>> print(tfutil.shape_to_list(out_expr[0].shape)[1:])
[1024, 1024, 3]
>>> print(num_items)
1
>>> print([num_items] + tfutil.shape_to_list(out_expr[0].shape)[1:])
[1, 1024, 1024, 3]
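For reference, here is roughly how run ends up being invoked; this is a sketch loosely based on the official pretrained example script (which this post calls pretrained.py), assuming Gs has already been loaded from the pickled network, so treat the exact keyword arguments as illustrative rather than authoritative:

import numpy as np
import dnnlib.tflib as tflib

latents = np.random.RandomState(5).randn(1, Gs.input_shape[1])      # shape (1, 512)
fmt = dict(func=tflib.convert_images_to_uint8, nchw_to_nhwc=True)   # output_transform
images = Gs.run(latents, None, truncation_psi=0.7, randomize_noise=True,
                output_transform=fmt)
print(images.shape)   # (1, 1024, 1024, 3), dtype uint8

The labels argument is passed as None here, which is why the corresponding minibatch entry later has shape (1, 0).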

If you are interested in the data flow inside the Graph and the scopes defined by the author, you can run the snippet below (the generated graph is very clean and readable, and well worth studying):
"""
输出默认Grpah中op以及变量、Tensor等的名字(一般由name_scope或者variable_scope定义)到txt文件;输出Graph到Tensorboard,在终端
中使用“tensorboard --logdir ./logpath”打开。
"""
with open('./graph_names.txt','w') as f:
sep='\n'
test_names = [n.name for n in tf.get_default_graph().as_graph_def().node]
f.write(sep.join(test_names))
summary_writer = tf.summary.FileWriter("log",tf.get_default_graph())

In the for loop that follows, minibatch_size is a parameter of run. If it is None, then minibatch_size = num_items, where num_items = in_arrays[0].shape[0]. When pretrained.py is executed (minibatch_size is left as None), the loop therefore runs only once, with mb_end and mb_num both equal to 1, so mb_in is a list holding two np.ndarrays of shapes (1, 512) and (1, 0). In fact mb_in[0] == in_arrays[0] element-wise; you can verify that two arrays are identical with (a == b).all(). The slicing behaviour is reproduced in the small sketch below.
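The loop can be mimicked with plain NumPy; the arrays below are hypothetical stand-ins with the shapes seen above:

import numpy as np

# Hypothetical stand-ins: (1, 512) latents and no labels, as in pretrained.py.
in_arrays = [np.random.randn(1, 512), None]
input_shapes = [[None, 512], [None, 0]]

num_items = in_arrays[0].shape[0]
minibatch_size = num_items                              # the default when minibatch_size is None

for mb_begin in range(0, num_items, minibatch_size):    # executes exactly once here
    mb_end = min(mb_begin + minibatch_size, num_items)
    mb_num = mb_end - mb_begin
    mb_in = [src[mb_begin:mb_end] if src is not None
             else np.zeros([mb_num] + shape[1:])
             for src, shape in zip(in_arrays, input_shapes)]

print(mb_in[0].shape, mb_in[1].shape)                   # (1, 512) (1, 0)
print((mb_in[0] == in_arrays[0]).all())                 # True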
mb_out = tf.get_default_session().run(...) is the actual inference step, and mb_out holds the prediction results. The data in src (i.e. mb_out) is then copied into dst, the pre-allocated out_arrays.

Finally, run decides whether to return the outputs as a list. At this point the method returns successfully. The most important line in the whole method is tf.get_default_session().run(), which executes the output ops in the default session while feeding mb_in to the network through the in_expr placeholders.

Note: the dimensions of a tf.Tensor can be inspected with for dim in tensor.shape: print(dim.value); the batch dimension is in fact None.
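A quick illustration of that note (TensorFlow 1.x, with a hypothetical placeholder):

import tensorflow as tf

t = tf.placeholder(tf.float32, shape=[None, 1024, 1024, 3])   # hypothetical tensor
print([dim.value for dim in t.shape])                          # [None, 1024, 1024, 3]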

get_output_for

get_output_for is another method of the Network class.

def get_output_for(self, *in_expr: TfExpression, return_as_list: bool = False, **dynamic_kwargs) -> Union[TfExpression, List[TfExpression]]:
    """Construct TensorFlow expression(s) for the output(s) of this network, given the input expression(s)."""
    assert len(in_expr) == self.num_inputs
    assert not all(expr is None for expr in in_expr)

    # Finalize build func kwargs.
    build_kwargs = dict(self.static_kwargs)
    build_kwargs.update(dynamic_kwargs)
    build_kwargs["is_template_graph"] = False
    build_kwargs["components"] = self.components

    # Build TensorFlow graph to evaluate the network.
    with tfutil.absolute_variable_scope(self.scope, reuse=True), tf.name_scope(self.name):
        assert tf.get_variable_scope().name == self.scope
        valid_inputs = [expr for expr in in_expr if expr is not None]
        final_inputs = []
        for expr, name, shape in zip(in_expr, self.input_names, self.input_shapes):
            if expr is not None:
                expr = tf.identity(expr, name=name)
            else:
                expr = tf.zeros([tf.shape(valid_inputs[0])[0]] + shape[1:], name=name)
            final_inputs.append(expr)
        out_expr = self._build_func(*final_inputs, **build_kwargs)

    # Propagate input shapes back to the user-specified expressions.
    for expr, final in zip(in_expr, final_inputs):
        if isinstance(expr, tf.Tensor):
            expr.set_shape(final.shape)

    # Express outputs in the desired format.
    assert tfutil.is_tf_expression(out_expr) or isinstance(out_expr, tuple)
    if return_as_list:
        out_expr = [out_expr] if tfutil.is_tf_expression(out_expr) else list(out_expr)
    return out_expr

## Other helpers referenced by the function above
TfExpression = Union[tf.Tensor, tf.Variable, tf.Operation]

def is_tf_expression(x: Any) -> bool:
    # True if x is a valid TensorFlow expression.
    return isinstance(x, (tf.Tensor, tf.Variable, tf.Operation))

def absolute_variable_scope(scope: str, **kwargs) -> tf.variable_scope:
    # Forcefully enter the given variable scope, ignoring any surrounding scopes.
    return tf.variable_scope(tf.VariableScope(name=scope, **kwargs), auxiliary_name_scope=False)
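Of the helpers above, absolute_variable_scope enters a variable scope by its absolute name, ignoring whatever scope is currently open (and auxiliary_name_scope=False keeps it from opening a matching name scope). A minimal sketch of the difference, assuming TensorFlow 1.x and toy scope names invented for illustration:

import tensorflow as tf

with tf.variable_scope("outer"):
    with tf.variable_scope("inner"):                              # relative: nested under "outer"
        a = tf.get_variable("a", shape=[])                        # a.name == "outer/inner/a:0"
    with absolute_variable_scope("standalone", reuse=tf.AUTO_REUSE):  # absolute: ignores "outer"
        b = tf.get_variable("b", shape=[])                        # b.name == "standalone/b:0"
print(a.name, b.name)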


TfExpression is defined as a valid TF expression: a typing.Union covering tf.Tensor, tf.Variable, and tf.Operation. Next, let's look at the dict update method:

>>> a = {'1': 11,'2': 22,'3': 33,}
>>> b = {'2': 33,'4': 44,'5': 55,'6': 66,}
>>> a.update(b)
>>> print(a)
{'1': 11, '2': 33, '3': 33, '4': 44, '5': 55, '6': 66}
# Merge dict b into a; for duplicate keys, the value from b overwrites the one already in a.

For more on scopes, see any of the TensorFlow scope tutorials. Scopes control the namespace of variable names and make variable reuse possible; in a complex network they also keep the graph that TensorBoard draws much cleaner, which makes debugging easier. A small reuse example follows below.
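A minimal sketch of variable reuse with variable_scope (TensorFlow 1.x; the scope and variable names are made up for illustration):

import tensorflow as tf

with tf.variable_scope("mapping"):
    w = tf.get_variable("w", shape=[512, 512])       # created: mapping/w:0

with tf.variable_scope("mapping", reuse=True):
    w_again = tf.get_variable("w")                   # reused, not re-created

print(w is w_again)                                  # True
print(w.name)                                        # mapping/w:0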

First, the assert statement checks that the variable scope just entered matches self.scope. Then the non-None entries of in_expr are collected into the list valid_inputs. Next the inputs are re-exposed under the new scope; the tf.identity used here matters because it creates new graph nodes that tie the inputs into the computation under this scope. When pretrained.py runs, the first call to get_output_for maps G/latents_in and G/labels_in to G/G_mapping/latents_in and G/G_mapping/labels_in, i.e. the inputs now appear under the G_mapping scope. Note also that reuse=True lets variables that already exist under the scope be reused instead of re-created, and that valid_inputs simply holds references to the same tensor objects as in_expr. Let's look at a simple example of the effect of these operations:

What happens here

## Reproduce the same scopes and variables as the source code
import tensorflow as tf
from tensorflow.python.framework.tensor_shape import unknown_shape

with tf.device('/gpu:0'):
    with tf.name_scope("G"):
        # Same as the source: a list of two Tensors with unknown shape
        in_expr = [tf.placeholder(float, shape=unknown_shape(), name="latents_in"),
                   tf.placeholder(float, shape=unknown_shape(), name="labels_in")]
        input_shapes = [[None, 512], [None, 0]]
        input_names = ['latents_in', 'labels_in']
        scope = 'G_mapping'
        name = 'G_mapping'
        with absolute_variable_scope(scope, reuse=True), tf.name_scope(name):
            # reuse: enable variable reuse, so repeated calls do not allocate new
            # variables but point back to the ones that already exist
            assert tf.get_variable_scope().name == scope
            valid_inputs = [expr for expr in in_expr if expr is not None]
            assert id(valid_inputs[0]) == id(in_expr[0])
            # The list comprehension only copies references, so valid_inputs[0]
            # and in_expr[0] are the same Python object (same memory address)
            final_inputs = []
            for expr, name, shape in zip(in_expr, input_names, input_shapes):
                if expr is not None:
                    print('\033[31;47m before:\033[0m', name, expr)
                    expr = tf.identity(expr, name=name)
                    print('\033[31;47m after:\033[0m', name, expr)
                else:
                    expr = tf.zeros([tf.shape(valid_inputs[0])[0]] + shape[1:], name=name)
                final_inputs.append(expr)
"""
final_inputs: [<tf.Tensor 'G/G_mapping/latents_in:0' shape=<unknown> dtype=float32>,
               <tf.Tensor 'G/G_mapping/labels_in:0' shape=<unknown> dtype=float32>]
"""

(TensorBoard screenshot of the resulting graph)

tf.identity

"""
Signature: tf.identity(input, name=None)
Docstring:
返回与输入具有相同尺寸以及上下文的张量。

Args:
input: Tensor.
name: op的名字.

Returns:
返回与输入具有相同类型的Tensor。
"""
x = tf.Variable(0.0, name = 'x')
plus = tf.assign_add(x, 1, name = 'plus') # 对'x'加1
with tf.control_dependencies([plus]):
y = tf.identity(x, name = 'y') # y的更新将依赖于op plus
init = tf.global_variables_initializer()
with tf.Session() as sess:
init.run()
for i in range(3):
print(sess.run(y), sess.run(x))
# [OUTPUT]:
1.0 1.0
2.0 2.0
3.0 3.0

The snippet above defines an op plus that increments the variable x. Code placed inside the tf.control_dependencies([plus]) context only runs after plus has executed (i.e. after the increment), so every sess.run(y) first triggers plus.
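A common pitfall worth sketching (hypothetical variables, TensorFlow 1.x): simply aliasing x inside the context does not create a new op, so the control dependency is never attached; tf.identity is what makes it stick.

x = tf.Variable(0.0)
plus = tf.assign_add(x, 1)
with tf.control_dependencies([plus]):
    y_bad = x                    # no new op created, so the dependency is NOT attached
    y_good = tf.identity(x)      # identity creates an op inside the context

with tf.Session() as sess:
    sess.run(tf.global_variables_initializer())
    print(sess.run(y_bad))       # 0.0 -- x is read without running plus
    print(sess.run(y_good))      # 1.0 -- plus runs first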
(TensorBoard screenshot of the graph for this example)

_build_func

Here _build_func is the G_mapping, G_synthesis, or G_style function; the source lives in training/networks_stylegan.py, and the data flow is shown in the figure below.

set_shape can change the shape of a placeholder:

>>> test = tf.placeholder(float, shape = unknown_shape(), name = "Test")
# test.get_shape() = <unknown>
>>> test.set_shape([3, 512, 512])
# This touches on TensorFlow's distinction between dynamic and static shapes:
# a tensor's shape may change as it flows through the graph.
# set_shape can only refine a shape while at least one dimension is still
# undetermined (None or ?).
# test.get_shape() = (3, 512, 512); once fully determined, set_shape cannot
# change it again.

expr.set_shape(final.shape) thus takes the input tensors, whose shapes were unknown, and sets them to the expected shapes [final.shape for final in final_inputs].
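For completeness, a small sketch of the static-versus-dynamic-shape distinction mentioned above (hypothetical placeholder, TensorFlow 1.x):

x = tf.placeholder(tf.float32, shape=[None, 512])
print(x.get_shape().as_list())   # [None, 512] -- static shape, partially unknown
x.set_shape([16, 512])           # refine the static shape (must stay compatible)
print(x.get_shape().as_list())   # [16, 512]
dynamic = tf.shape(x)            # dynamic shape: a Tensor evaluated at run time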

Return

return out_expr returns the TensorFlow expression(s) for the generated high-resolution images; evaluating them in a session (which is what run does) yields the actual image arrays.
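As a rough usage sketch (the tensors below are hypothetical stand-ins), get_output_for is what you call when the inputs are already TensorFlow tensors inside a graph, e.g. when building a training loss, whereas run accepts NumPy arrays:

# Hypothetical tensors standing in for real training inputs.
latents = tf.random_normal([4, 512])
labels = tf.zeros([4, 0])
fake_images_out = G.get_output_for(latents, labels, is_training=True)
# fake_images_out is a TF expression; it only becomes pixels once a session runs it.
# is_training is forwarded to the build function via dynamic_kwargs.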