mobilenet.py 6.47 KB
Newer Older
eqy committed
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.
"""
Port of NNVM version of MobileNet to Relay.
"""
# pylint: disable=invalid-name

from tvm import relay
from . import layers
from .init import create_workload

26

eqy committed
27
def conv_block(data, name, channels, kernel_size=(3, 3), strides=(1, 1),
28
               padding=(1, 1), epsilon=1e-5, layout='NCHW'):
eqy committed
29 30 31 32 33 34 35 36
    """Helper function to construct conv_bn-relu"""
    # convolution + bn + relu
    conv = layers.conv2d(
        data=data,
        channels=channels,
        kernel_size=kernel_size,
        strides=strides,
        padding=padding,
37 38
        data_layout=layout,
        kernel_layout=layers.conv_kernel_layout(layout),
eqy committed
39 40 41 42 43 44 45 46
        name=name+'_conv')
    bn = layers.batch_norm_infer(data=conv, epsilon=epsilon, name=name + '_bn')
    act = relay.nn.relu(data=bn)
    return act


def separable_conv_block(data, name, depthwise_channels, pointwise_channels,
                         kernel_size=(3, 3), downsample=False, padding=(1, 1),
47
                         epsilon=1e-5, layout='NCHW'):
eqy committed
48 49 50 51 52 53 54 55 56 57 58 59 60
    """Helper function to get a separable conv block"""
    if downsample:
        strides = (2, 2)
    else:
        strides = (1, 1)
    # depthwise convolution + bn + relu
    conv1 = layers.conv2d(
        data=data,
        channels=depthwise_channels,
        groups=depthwise_channels,
        kernel_size=kernel_size,
        strides=strides,
        padding=padding,
61 62
        data_layout=layout,
        kernel_layout=layers.conv_kernel_layout(layout, True),
eqy committed
63 64 65 66 67 68 69 70 71 72
        name=name+'_depthwise_conv1')
    bn1 = layers.batch_norm_infer(data=conv1, epsilon=epsilon, name=name+'_bn1')
    act1 = relay.nn.relu(data=bn1)
    # pointwise convolution + bn + relu
    conv2 = layers.conv2d(
        data=act1,
        channels=pointwise_channels,
        kernel_size=(1, 1),
        strides=(1, 1),
        padding=(0, 0),
73 74
        data_layout=layout,
        kernel_layout=layers.conv_kernel_layout(layout),
eqy committed
75 76 77 78 79 80 81
        name=name + '_conv2')
    bn2 = layers.batch_norm_infer(data=conv2, epsilon=epsilon, name=name+'_bn2')
    act2 = relay.nn.relu(data=bn2)
    return act2


def mobile_net(num_classes=1000, data_shape=(1, 3, 224, 224),
82
               dtype='float32', alpha=1.0, is_shallow=False, layout='NCHW'):
eqy committed
83 84
    """Function to construct a MobileNet"""
    data = relay.var("data", shape=data_shape, dtype=dtype)
85 86
    body = conv_block(data, 'conv_block_1', int(32*alpha), strides=(2, 2),
                      layout=layout)
eqy committed
87
    body = separable_conv_block(body, 'separable_conv_block_1',
88
                                int(32*alpha), int(64*alpha), layout=layout)
eqy committed
89
    body = separable_conv_block(body, 'separable_conv_block_2',
90 91
                                int(64*alpha), int(128*alpha), downsample=True,
                                layout=layout)
eqy committed
92
    body = separable_conv_block(body, 'separable_conv_block_3',
93
                                int(128*alpha), int(128*alpha), layout=layout)
eqy committed
94
    body = separable_conv_block(body, 'separable_conv_block_4',
95 96
                                int(128*alpha), int(256*alpha), downsample=True,
                                layout=layout)
eqy committed
97
    body = separable_conv_block(body, 'separable_conv_block_5',
98
                                int(256*alpha), int(256*alpha), layout=layout)
eqy committed
99
    body = separable_conv_block(body, 'separable_conv_block_6',
100 101
                                int(256*alpha), int(512*alpha), downsample=True,
                                layout=layout)
eqy committed
102 103
    if is_shallow:
        body = separable_conv_block(body, 'separable_conv_block_7',
104 105
                                    int(512*alpha), int(1024*alpha),
                                    downsample=True, layout=layout)
eqy committed
106
        body = separable_conv_block(body, 'separable_conv_block_8',
107 108
                                    int(1024*alpha), int(1024*alpha),
                                    downsample=True, layout=layout)
eqy committed
109 110 111
    else:
        for i in range(7, 12):
            body = separable_conv_block(body, 'separable_conv_block_%d' % i,
112 113
                                        int(512*alpha), int(512*alpha),
                                        layout=layout)
eqy committed
114
        body = separable_conv_block(body, 'separable_conv_block_12',
115 116
                                    int(512*alpha), int(1024*alpha),
                                    downsample=True, layout=layout)
eqy committed
117
        body = separable_conv_block(body, 'separable_conv_block_13',
118 119 120
                                    int(1024*alpha), int(1024*alpha),
                                    layout=layout)
    pool = relay.nn.global_avg_pool2d(data=body, layout=layout)
eqy committed
121 122 123 124
    flatten = relay.nn.batch_flatten(data=pool)
    weight = relay.var('fc_weight')
    fc = relay.nn.dense(data=flatten, weight=weight, units=num_classes)
    softmax = relay.nn.softmax(data=fc)
Zhi committed
125
    return relay.Function(relay.analysis.free_vars(softmax), softmax)
eqy committed
126 127


128 129
def get_workload(batch_size=1, num_classes=1000, image_shape=(3, 224, 224),
                 dtype='float32', layout='NCHW'):
eqy committed
130 131 132 133 134 135 136 137 138 139 140
    """Get benchmark workload for mobilenet

    Parameters
    ----------
    batch_size : int, optional
        The batch size used in the model

    num_classes : int, optional
        Number of classes

    image_shape : tuple, optional
141
        The input image shape, cooperate with layout
eqy committed
142 143 144 145

    dtype : str, optional
        The data type

146 147 148 149
    layout : str, optional
        The data layout of image_shape and the operators
        cooperate with image_shape

eqy committed
150 151
    Returns
    -------
152 153
    mod : tvm.relay.Module
        The relay module that contains a MobileNet network.
eqy committed
154 155 156 157 158 159

    params : dict of str to NDArray
        The parameters.
    """
    data_shape = tuple([batch_size] + list(image_shape))
    net = mobile_net(num_classes=num_classes, data_shape=data_shape,
160 161
                     dtype=dtype, alpha=1.0, is_shallow=False,
                     layout=layout)
eqy committed
162
    return create_workload(net)