ops.py

import tensorflow as tf
import numpy as np
from deformable_convolution import *


def deform_conv2d(inputs, num_outputs, kernel_size, scope, norm=True, d_format='NHWC'):
    
    # 生成offset-field
    offset = tf.contrib.layers.conv2d(
         inputs, kernel_size[0]*kernel_size[0]*2, [3,3], scope=scope+'/offset',
         data_format=d_format, activation_fn=None, weights_initializer=tf.zeros_initializer(dtype=tf.float32), biases_initializer=None)
    
    # 进行BN
    offset = tf.contrib.layers.batch_norm(
         offset, decay=0.9, center=True, activation_fn=tf.nn.tanh,
         updates_collections=None, epsilon=1e-5, scope=scope+'/offset'+'/batch_norm',
         data_format=d_format)
    
    # 生成deformed feature
    input_shape = [inputs.shape[0].value, inputs.shape[1].value, inputs.shape[2].value, inputs.shape[3].value]
    dcn = DCN(input_shape, kernel_size)
    deformed_feature = dcn.deform_conv(inputs, offset, scope)
    
    # 完成卷积操作
    outputs = tf.contrib.layers.conv2d(
        deformed_feature, num_outputs, kernel_size, scope=scope,
        stride=kernel_size[0], padding="VALID", data_format=d_format, 
        activation_fn=None, biases_initializer=None)
    
    if norm:
        outputs = tf.contrib.layers.batch_norm(
            outputs, decay=0.9, center=True, activation_fn=tf.nn.relu,
            updates_collections=None, epsilon=1e-5, scope=scope+'/batch_norm',
            data_format=d_format)
    else:
        outputs = tf.nn.relu(outputs, name=scope+'/relu')
    return outputs
    
    
def conv2d(inputs, num_outputs, kernel_size, scope, norm=True, d_format='NHWC'):
    outputs = tf.contrib.layers.conv2d(
        inputs, num_outputs, kernel_size, scope=scope,
        data_format=d_format, activation_fn=None, biases_initializer=None)
    if norm:
        outputs = tf.contrib.layers.batch_norm(
            outputs, decay=0.9, center=True, activation_fn=tf.nn.relu,
            updates_collections=None, epsilon=1e-5, scope=scope+'/batch_norm',
            data_format=d_format)
    else:
        outputs = tf.nn.relu(outputs, name=scope+'/relu')
    return outputs


def co_conv2d(inputs, out_num, kernel_size, scope, norm=True, d_format='NHWC'):
    conv1 = tf.contrib.layers.conv2d(
        inputs, out_num, kernel_size, stride=2, scope=scope+'/conv0',
        data_format=d_format, activation_fn=None, biases_initializer=None)
    outputs = dilated_conv(conv1, out_num, kernel_size, scope)
    return outputs


def deconv(inputs, out_num, kernel_size, scope, d_format='NHWC'):
    outputs = tf.contrib.layers.conv2d_transpose(
        inputs, out_num, kernel_size, scope=scope, stride=[2, 2],
        data_format=d_format, activation_fn=None, biases_initializer=None)
    return tf.contrib.layers.batch_norm(
        outputs, decay=0.9, activation_fn=tf.nn.relu, updates_collections=None,
        epsilon=1e-5, scope=scope+'/batch_norm', data_format=d_format)


def co_dilated_conv(inputs, out_num, kernel_size, scope, d_format='NHWC'):
    axis = (d_format.index('H'), d_format.index('W'))
    channel_axis = d_format.index('C')
    conv1 = conv2d(inputs, out_num, kernel_size, scope+'/conv1', False)
    conv1_concat = tf.concat(
        [inputs, conv1], channel_axis, name=scope+'/concat1')
    conv2 = conv2d(conv1_concat, out_num, kernel_size, scope+'/conv2', False)
    conv2_concat = tf.concat(
        [conv1_concat, conv2], channel_axis, name=scope+'/concat2')
    conv3 = conv2d(conv2_concat, 2*out_num, kernel_size, scope+'/conv3', False)
    conv4, conv5 = tf.split(conv3, 2, channel_axis, name=scope+'/split')
    dialte1 = dilate_tensor(conv1, axis, 0, 0, scope+'/dialte1')
    dialte2 = dilate_tensor(conv2, axis, 1, 1, scope+'/dialte2')
    dialte3 = dilate_tensor(conv4, axis, 1, 0, scope+'/dialte3')
    dialte4 = dilate_tensor(conv5, axis, 0, 1, scope+'/dialte4')
    outputs = tf.add_n([dialte1, dialte2, dialte3, dialte4], scope+'/add')
    return tf.contrib.layers.batch_norm(
        outputs, decay=0.9, activation_fn=tf.nn.relu, updates_collections=None,
        epsilon=1e-5, scope=scope+'/batch_norm', data_format=d_format)


def dilated_conv(inputs, out_num, kernel_size, scope, d_format='NHWC'):
    axis = (d_format.index('H'), d_format.index('W'))
    conv1 = conv2d(inputs, out_num, kernel_size, scope+'/conv1', False)
    dilated_inputs = dilate_tensor(inputs, axis, 0, 0, scope+'/dialte_inputs')
    dilated_conv1 = dilate_tensor(conv1, axis, 1, 1, scope+'/dialte_conv1')
    conv1 = tf.add(dilated_inputs, dilated_conv1, scope+'/add1')
    with tf.variable_scope(scope+'/conv2'):
        shape = list(kernel_size) + [out_num, out_num]
        weights = tf.get_variable(
            'weights', shape, initializer=tf.truncated_normal_initializer())
        weights = tf.multiply(weights, get_mask(shape, scope))
        strides = [1, 1, 1, 1]
        conv2 = tf.nn.conv2d(conv1, weights, strides, padding='SAME',
                             data_format=d_format)
    outputs = tf.add(conv1, conv2, name=scope+'/add2')
    return tf.contrib.layers.batch_norm(
        outputs, decay=0.9, activation_fn=tf.nn.relu, updates_collections=None,
        epsilon=1e-5, scope=scope+'/batch_norm', data_format=d_format)


def get_mask(shape, scope):
    new_shape = (shape[0]*shape[1], shape[2], shape[3])
    mask = np.ones(new_shape, dtype=np.float32)
    for i in range(0, new_shape[0], 2):
        mask[i, :, :] = 0
    mask = np.reshape(mask, shape, 'F')
    return tf.constant(mask, dtype=tf.float32, name=scope+'/mask')


def dilate_tensor(inputs, axis, row_shift, column_shift, scope):
    rows = tf.unstack(inputs, axis=axis[0], name=scope+'/rowsunstack')
    row_zeros = tf.zeros(
        rows[0].shape, dtype=tf.float32, name=scope+'/rowzeros')
    for index in range(len(rows), 0, -1):
        rows.insert(index-row_shift, row_zeros)
    row_outputs = tf.stack(rows, axis=axis[0], name=scope+'/rowsstack')
    columns = tf.unstack(
        row_outputs, axis=axis[1], name=scope+'/columnsunstack')
    columns_zeros = tf.zeros(
        columns[0].shape, dtype=tf.float32, name=scope+'/columnzeros')
    for index in range(len(columns), 0, -1):
        columns.insert(index-column_shift, columns_zeros)
    column_outputs = tf.stack(
        columns, axis=axis[1], name=scope+'/columnsstack')
    return column_outputs


def pool2d(inputs, kernel_size, scope, data_format='NHWC'):
    return tf.contrib.layers.max_pool2d(
        inputs, kernel_size, scope=scope, padding='SAME',
        data_format=data_format)

def weight_variable(shape):
    initial = tf.zeros(shape)
    return tf.Variable(initial)

def bias_variable(shape):
    initial = tf.random_normal(shape, mean=0.0, stddev=0.01)
    return tf.Variable(initial)