In [1]:
import mxnet as mx 
from symbol import get_resnet_model
from symbol import YOLO_loss
from data_ulti import get_iterator

In [2]:
# Build the network symbol and fetch the pretrained ResNet-50 parameters.
# get_resnet_model is project-local (symbol.py); presumably its arguments are the
# checkpoint prefix and epoch, mirroring load_checkpoint below — TODO confirm.
sym = get_resnet_model('resnet-50', 0)
# Only the two parameter dicts are kept; the first returned value is discarded.
# NOTE(review): binding `_` at cell top level shadows IPython's last-output
# variable for the rest of the session — consider a named throwaway instead.
_, args_params, aux_params = mx.model.load_checkpoint('resnet-50', 0)
# Handle on the internal 'logit_output' node.
# NOTE(review): `logit` is not referenced again in the cells shown here.
logit = sym.get_internals()['logit_output']
# Last expression of the cell, so the rendered network graph becomes the cell output.
mx.viz.plot_network(sym)


Out[2]:
plot data data bn_data_gamma bn_data_gamma bn_data_beta bn_data_beta bn_data_moving_mean bn_data_moving_mean bn_data_moving_var bn_data_moving_var bn_data bn_data bn_data->data bn_data->bn_data_gamma bn_data->bn_data_beta bn_data->bn_data_moving_mean bn_data->bn_data_moving_var conv0 Convolution 7x7/2x2, 64 conv0->bn_data bn0_gamma bn0_gamma bn0_beta bn0_beta bn0_moving_mean bn0_moving_mean bn0_moving_var bn0_moving_var bn0 bn0 bn0->conv0 bn0->bn0_gamma bn0->bn0_beta bn0->bn0_moving_mean bn0->bn0_moving_var relu0 Activation relu relu0->bn0 pooling0 Pooling max, 3x3/2x2 pooling0->relu0 stage1_unit1_bn1_gamma stage1_unit1_bn1_gamma stage1_unit1_bn1_beta stage1_unit1_bn1_beta stage1_unit1_bn1_moving_mean stage1_unit1_bn1_moving_mean stage1_unit1_bn1_moving_var stage1_unit1_bn1_moving_var stage1_unit1_bn1 stage1_unit1_bn1 stage1_unit1_bn1->pooling0 stage1_unit1_bn1->stage1_unit1_bn1_gamma stage1_unit1_bn1->stage1_unit1_bn1_beta stage1_unit1_bn1->stage1_unit1_bn1_moving_mean stage1_unit1_bn1->stage1_unit1_bn1_moving_var stage1_unit1_relu1 Activation relu stage1_unit1_relu1->stage1_unit1_bn1 stage1_unit1_conv1 Convolution 1x1/1x1, 64 stage1_unit1_conv1->stage1_unit1_relu1 stage1_unit1_bn2_gamma stage1_unit1_bn2_gamma stage1_unit1_bn2_beta stage1_unit1_bn2_beta stage1_unit1_bn2_moving_mean stage1_unit1_bn2_moving_mean stage1_unit1_bn2_moving_var stage1_unit1_bn2_moving_var stage1_unit1_bn2 stage1_unit1_bn2 stage1_unit1_bn2->stage1_unit1_conv1 stage1_unit1_bn2->stage1_unit1_bn2_gamma stage1_unit1_bn2->stage1_unit1_bn2_beta stage1_unit1_bn2->stage1_unit1_bn2_moving_mean stage1_unit1_bn2->stage1_unit1_bn2_moving_var stage1_unit1_relu2 Activation relu stage1_unit1_relu2->stage1_unit1_bn2 stage1_unit1_conv2 Convolution 3x3/1x1, 64 stage1_unit1_conv2->stage1_unit1_relu2 stage1_unit1_bn3_gamma stage1_unit1_bn3_gamma stage1_unit1_bn3_beta stage1_unit1_bn3_beta stage1_unit1_bn3_moving_mean stage1_unit1_bn3_moving_mean stage1_unit1_bn3_moving_var stage1_unit1_bn3_moving_var 
stage1_unit1_bn3 stage1_unit1_bn3 stage1_unit1_bn3->stage1_unit1_conv2 stage1_unit1_bn3->stage1_unit1_bn3_gamma stage1_unit1_bn3->stage1_unit1_bn3_beta stage1_unit1_bn3->stage1_unit1_bn3_moving_mean stage1_unit1_bn3->stage1_unit1_bn3_moving_var stage1_unit1_relu3 Activation relu stage1_unit1_relu3->stage1_unit1_bn3 stage1_unit1_conv3 Convolution 1x1/1x1, 256 stage1_unit1_conv3->stage1_unit1_relu3 stage1_unit1_sc Convolution 1x1/1x1, 256 stage1_unit1_sc->stage1_unit1_relu1 _plus0 _plus0 _plus0->stage1_unit1_conv3 _plus0->stage1_unit1_sc _mulscalar0 _mulscalar0 _plus0->_mulscalar0 _divscalar1 _divscalar1 _plus0->_divscalar1 stage1_unit2_bn1_gamma stage1_unit2_bn1_gamma stage1_unit2_bn1_beta stage1_unit2_bn1_beta stage1_unit2_bn1_moving_mean stage1_unit2_bn1_moving_mean stage1_unit2_bn1_moving_var stage1_unit2_bn1_moving_var stage1_unit2_bn1 stage1_unit2_bn1 stage1_unit2_bn1->_plus0 stage1_unit2_bn1->stage1_unit2_bn1_gamma stage1_unit2_bn1->stage1_unit2_bn1_beta stage1_unit2_bn1->stage1_unit2_bn1_moving_mean stage1_unit2_bn1->stage1_unit2_bn1_moving_var stage1_unit2_relu1 Activation relu stage1_unit2_relu1->stage1_unit2_bn1 stage1_unit2_conv1 Convolution 1x1/1x1, 64 stage1_unit2_conv1->stage1_unit2_relu1 stage1_unit2_bn2_gamma stage1_unit2_bn2_gamma stage1_unit2_bn2_beta stage1_unit2_bn2_beta stage1_unit2_bn2_moving_mean stage1_unit2_bn2_moving_mean stage1_unit2_bn2_moving_var stage1_unit2_bn2_moving_var stage1_unit2_bn2 stage1_unit2_bn2 stage1_unit2_bn2->stage1_unit2_conv1 stage1_unit2_bn2->stage1_unit2_bn2_gamma stage1_unit2_bn2->stage1_unit2_bn2_beta stage1_unit2_bn2->stage1_unit2_bn2_moving_mean stage1_unit2_bn2->stage1_unit2_bn2_moving_var stage1_unit2_relu2 Activation relu stage1_unit2_relu2->stage1_unit2_bn2 stage1_unit2_conv2 Convolution 3x3/1x1, 64 stage1_unit2_conv2->stage1_unit2_relu2 stage1_unit2_bn3_gamma stage1_unit2_bn3_gamma stage1_unit2_bn3_beta stage1_unit2_bn3_beta stage1_unit2_bn3_moving_mean stage1_unit2_bn3_moving_mean stage1_unit2_bn3_moving_var 
stage1_unit2_bn3_moving_var stage1_unit2_bn3 stage1_unit2_bn3 stage1_unit2_bn3->stage1_unit2_conv2 stage1_unit2_bn3->stage1_unit2_bn3_gamma stage1_unit2_bn3->stage1_unit2_bn3_beta stage1_unit2_bn3->stage1_unit2_bn3_moving_mean stage1_unit2_bn3->stage1_unit2_bn3_moving_var stage1_unit2_relu3 Activation relu stage1_unit2_relu3->stage1_unit2_bn3 stage1_unit2_conv3 Convolution 1x1/1x1, 256 stage1_unit2_conv3->stage1_unit2_relu3 _plus1 _plus1 _plus1->_plus0 _plus1->stage1_unit2_conv3 stage1_unit3_bn1_gamma stage1_unit3_bn1_gamma stage1_unit3_bn1_beta stage1_unit3_bn1_beta stage1_unit3_bn1_moving_mean stage1_unit3_bn1_moving_mean stage1_unit3_bn1_moving_var stage1_unit3_bn1_moving_var stage1_unit3_bn1 stage1_unit3_bn1 stage1_unit3_bn1->_plus1 stage1_unit3_bn1->stage1_unit3_bn1_gamma stage1_unit3_bn1->stage1_unit3_bn1_beta stage1_unit3_bn1->stage1_unit3_bn1_moving_mean stage1_unit3_bn1->stage1_unit3_bn1_moving_var stage1_unit3_relu1 Activation relu stage1_unit3_relu1->stage1_unit3_bn1 stage1_unit3_conv1 Convolution 1x1/1x1, 64 stage1_unit3_conv1->stage1_unit3_relu1 stage1_unit3_bn2_gamma stage1_unit3_bn2_gamma stage1_unit3_bn2_beta stage1_unit3_bn2_beta stage1_unit3_bn2_moving_mean stage1_unit3_bn2_moving_mean stage1_unit3_bn2_moving_var stage1_unit3_bn2_moving_var stage1_unit3_bn2 stage1_unit3_bn2 stage1_unit3_bn2->stage1_unit3_conv1 stage1_unit3_bn2->stage1_unit3_bn2_gamma stage1_unit3_bn2->stage1_unit3_bn2_beta stage1_unit3_bn2->stage1_unit3_bn2_moving_mean stage1_unit3_bn2->stage1_unit3_bn2_moving_var stage1_unit3_relu2 Activation relu stage1_unit3_relu2->stage1_unit3_bn2 stage1_unit3_conv2 Convolution 3x3/1x1, 64 stage1_unit3_conv2->stage1_unit3_relu2 stage1_unit3_bn3_gamma stage1_unit3_bn3_gamma stage1_unit3_bn3_beta stage1_unit3_bn3_beta stage1_unit3_bn3_moving_mean stage1_unit3_bn3_moving_mean stage1_unit3_bn3_moving_var stage1_unit3_bn3_moving_var stage1_unit3_bn3 stage1_unit3_bn3 stage1_unit3_bn3->stage1_unit3_conv2 stage1_unit3_bn3->stage1_unit3_bn3_gamma 
stage1_unit3_bn3->stage1_unit3_bn3_beta stage1_unit3_bn3->stage1_unit3_bn3_moving_mean stage1_unit3_bn3->stage1_unit3_bn3_moving_var stage1_unit3_relu3 Activation relu stage1_unit3_relu3->stage1_unit3_bn3 stage1_unit3_conv3 Convolution 1x1/1x1, 256 stage1_unit3_conv3->stage1_unit3_relu3 _plus2 _plus2 _plus2->_plus1 _plus2->stage1_unit3_conv3 stage2_unit1_bn1_gamma stage2_unit1_bn1_gamma stage2_unit1_bn1_beta stage2_unit1_bn1_beta stage2_unit1_bn1_moving_mean stage2_unit1_bn1_moving_mean stage2_unit1_bn1_moving_var stage2_unit1_bn1_moving_var stage2_unit1_bn1 stage2_unit1_bn1 stage2_unit1_bn1->_plus2 stage2_unit1_bn1->stage2_unit1_bn1_gamma stage2_unit1_bn1->stage2_unit1_bn1_beta stage2_unit1_bn1->stage2_unit1_bn1_moving_mean stage2_unit1_bn1->stage2_unit1_bn1_moving_var stage2_unit1_relu1 Activation relu stage2_unit1_relu1->stage2_unit1_bn1 stage2_unit1_conv1 Convolution 1x1/1x1, 128 stage2_unit1_conv1->stage2_unit1_relu1 stage2_unit1_bn2_gamma stage2_unit1_bn2_gamma stage2_unit1_bn2_beta stage2_unit1_bn2_beta stage2_unit1_bn2_moving_mean stage2_unit1_bn2_moving_mean stage2_unit1_bn2_moving_var stage2_unit1_bn2_moving_var stage2_unit1_bn2 stage2_unit1_bn2 stage2_unit1_bn2->stage2_unit1_conv1 stage2_unit1_bn2->stage2_unit1_bn2_gamma stage2_unit1_bn2->stage2_unit1_bn2_beta stage2_unit1_bn2->stage2_unit1_bn2_moving_mean stage2_unit1_bn2->stage2_unit1_bn2_moving_var stage2_unit1_relu2 Activation relu stage2_unit1_relu2->stage2_unit1_bn2 stage2_unit1_conv2 Convolution 3x3/2x2, 128 stage2_unit1_conv2->stage2_unit1_relu2 stage2_unit1_bn3_gamma stage2_unit1_bn3_gamma stage2_unit1_bn3_beta stage2_unit1_bn3_beta stage2_unit1_bn3_moving_mean stage2_unit1_bn3_moving_mean stage2_unit1_bn3_moving_var stage2_unit1_bn3_moving_var stage2_unit1_bn3 stage2_unit1_bn3 stage2_unit1_bn3->stage2_unit1_conv2 stage2_unit1_bn3->stage2_unit1_bn3_gamma stage2_unit1_bn3->stage2_unit1_bn3_beta stage2_unit1_bn3->stage2_unit1_bn3_moving_mean stage2_unit1_bn3->stage2_unit1_bn3_moving_var 
stage2_unit1_relu3 Activation relu stage2_unit1_relu3->stage2_unit1_bn3 stage2_unit1_conv3 Convolution 1x1/1x1, 512 stage2_unit1_conv3->stage2_unit1_relu3 stage2_unit1_sc Convolution 1x1/2x2, 512 stage2_unit1_sc->stage2_unit1_relu1 _plus3 _plus3 _plus3->stage2_unit1_conv3 _plus3->stage2_unit1_sc stage2_unit2_bn1_gamma stage2_unit2_bn1_gamma stage2_unit2_bn1_beta stage2_unit2_bn1_beta stage2_unit2_bn1_moving_mean stage2_unit2_bn1_moving_mean stage2_unit2_bn1_moving_var stage2_unit2_bn1_moving_var stage2_unit2_bn1 stage2_unit2_bn1 stage2_unit2_bn1->_plus3 stage2_unit2_bn1->stage2_unit2_bn1_gamma stage2_unit2_bn1->stage2_unit2_bn1_beta stage2_unit2_bn1->stage2_unit2_bn1_moving_mean stage2_unit2_bn1->stage2_unit2_bn1_moving_var stage2_unit2_relu1 Activation relu stage2_unit2_relu1->stage2_unit2_bn1 stage2_unit2_conv1 Convolution 1x1/1x1, 128 stage2_unit2_conv1->stage2_unit2_relu1 stage2_unit2_bn2_gamma stage2_unit2_bn2_gamma stage2_unit2_bn2_beta stage2_unit2_bn2_beta stage2_unit2_bn2_moving_mean stage2_unit2_bn2_moving_mean stage2_unit2_bn2_moving_var stage2_unit2_bn2_moving_var stage2_unit2_bn2 stage2_unit2_bn2 stage2_unit2_bn2->stage2_unit2_conv1 stage2_unit2_bn2->stage2_unit2_bn2_gamma stage2_unit2_bn2->stage2_unit2_bn2_beta stage2_unit2_bn2->stage2_unit2_bn2_moving_mean stage2_unit2_bn2->stage2_unit2_bn2_moving_var stage2_unit2_relu2 Activation relu stage2_unit2_relu2->stage2_unit2_bn2 stage2_unit2_conv2 Convolution 3x3/1x1, 128 stage2_unit2_conv2->stage2_unit2_relu2 stage2_unit2_bn3_gamma stage2_unit2_bn3_gamma stage2_unit2_bn3_beta stage2_unit2_bn3_beta stage2_unit2_bn3_moving_mean stage2_unit2_bn3_moving_mean stage2_unit2_bn3_moving_var stage2_unit2_bn3_moving_var stage2_unit2_bn3 stage2_unit2_bn3 stage2_unit2_bn3->stage2_unit2_conv2 stage2_unit2_bn3->stage2_unit2_bn3_gamma stage2_unit2_bn3->stage2_unit2_bn3_beta stage2_unit2_bn3->stage2_unit2_bn3_moving_mean stage2_unit2_bn3->stage2_unit2_bn3_moving_var stage2_unit2_relu3 Activation relu 
stage2_unit2_relu3->stage2_unit2_bn3 stage2_unit2_conv3 Convolution 1x1/1x1, 512 stage2_unit2_conv3->stage2_unit2_relu3 _plus4 _plus4 _plus4->_plus3 _plus4->stage2_unit2_conv3 stage2_unit3_bn1_gamma stage2_unit3_bn1_gamma stage2_unit3_bn1_beta stage2_unit3_bn1_beta stage2_unit3_bn1_moving_mean stage2_unit3_bn1_moving_mean stage2_unit3_bn1_moving_var stage2_unit3_bn1_moving_var stage2_unit3_bn1 stage2_unit3_bn1 stage2_unit3_bn1->_plus4 stage2_unit3_bn1->stage2_unit3_bn1_gamma stage2_unit3_bn1->stage2_unit3_bn1_beta stage2_unit3_bn1->stage2_unit3_bn1_moving_mean stage2_unit3_bn1->stage2_unit3_bn1_moving_var stage2_unit3_relu1 Activation relu stage2_unit3_relu1->stage2_unit3_bn1 stage2_unit3_conv1 Convolution 1x1/1x1, 128 stage2_unit3_conv1->stage2_unit3_relu1 stage2_unit3_bn2_gamma stage2_unit3_bn2_gamma stage2_unit3_bn2_beta stage2_unit3_bn2_beta stage2_unit3_bn2_moving_mean stage2_unit3_bn2_moving_mean stage2_unit3_bn2_moving_var stage2_unit3_bn2_moving_var stage2_unit3_bn2 stage2_unit3_bn2 stage2_unit3_bn2->stage2_unit3_conv1 stage2_unit3_bn2->stage2_unit3_bn2_gamma stage2_unit3_bn2->stage2_unit3_bn2_beta stage2_unit3_bn2->stage2_unit3_bn2_moving_mean stage2_unit3_bn2->stage2_unit3_bn2_moving_var stage2_unit3_relu2 Activation relu stage2_unit3_relu2->stage2_unit3_bn2 stage2_unit3_conv2 Convolution 3x3/1x1, 128 stage2_unit3_conv2->stage2_unit3_relu2 stage2_unit3_bn3_gamma stage2_unit3_bn3_gamma stage2_unit3_bn3_beta stage2_unit3_bn3_beta stage2_unit3_bn3_moving_mean stage2_unit3_bn3_moving_mean stage2_unit3_bn3_moving_var stage2_unit3_bn3_moving_var stage2_unit3_bn3 stage2_unit3_bn3 stage2_unit3_bn3->stage2_unit3_conv2 stage2_unit3_bn3->stage2_unit3_bn3_gamma stage2_unit3_bn3->stage2_unit3_bn3_beta stage2_unit3_bn3->stage2_unit3_bn3_moving_mean stage2_unit3_bn3->stage2_unit3_bn3_moving_var stage2_unit3_relu3 Activation relu stage2_unit3_relu3->stage2_unit3_bn3 stage2_unit3_conv3 Convolution 1x1/1x1, 512 stage2_unit3_conv3->stage2_unit3_relu3 _plus5 _plus5 
_plus5->_plus4 _plus5->stage2_unit3_conv3 stage2_unit4_bn1_gamma stage2_unit4_bn1_gamma stage2_unit4_bn1_beta stage2_unit4_bn1_beta stage2_unit4_bn1_moving_mean stage2_unit4_bn1_moving_mean stage2_unit4_bn1_moving_var stage2_unit4_bn1_moving_var stage2_unit4_bn1 stage2_unit4_bn1 stage2_unit4_bn1->_plus5 stage2_unit4_bn1->stage2_unit4_bn1_gamma stage2_unit4_bn1->stage2_unit4_bn1_beta stage2_unit4_bn1->stage2_unit4_bn1_moving_mean stage2_unit4_bn1->stage2_unit4_bn1_moving_var stage2_unit4_relu1 Activation relu stage2_unit4_relu1->stage2_unit4_bn1 stage2_unit4_conv1 Convolution 1x1/1x1, 128 stage2_unit4_conv1->stage2_unit4_relu1 stage2_unit4_bn2_gamma stage2_unit4_bn2_gamma stage2_unit4_bn2_beta stage2_unit4_bn2_beta stage2_unit4_bn2_moving_mean stage2_unit4_bn2_moving_mean stage2_unit4_bn2_moving_var stage2_unit4_bn2_moving_var stage2_unit4_bn2 stage2_unit4_bn2 stage2_unit4_bn2->stage2_unit4_conv1 stage2_unit4_bn2->stage2_unit4_bn2_gamma stage2_unit4_bn2->stage2_unit4_bn2_beta stage2_unit4_bn2->stage2_unit4_bn2_moving_mean stage2_unit4_bn2->stage2_unit4_bn2_moving_var stage2_unit4_relu2 Activation relu stage2_unit4_relu2->stage2_unit4_bn2 stage2_unit4_conv2 Convolution 3x3/1x1, 128 stage2_unit4_conv2->stage2_unit4_relu2 stage2_unit4_bn3_gamma stage2_unit4_bn3_gamma stage2_unit4_bn3_beta stage2_unit4_bn3_beta stage2_unit4_bn3_moving_mean stage2_unit4_bn3_moving_mean stage2_unit4_bn3_moving_var stage2_unit4_bn3_moving_var stage2_unit4_bn3 stage2_unit4_bn3 stage2_unit4_bn3->stage2_unit4_conv2 stage2_unit4_bn3->stage2_unit4_bn3_gamma stage2_unit4_bn3->stage2_unit4_bn3_beta stage2_unit4_bn3->stage2_unit4_bn3_moving_mean stage2_unit4_bn3->stage2_unit4_bn3_moving_var stage2_unit4_relu3 Activation relu stage2_unit4_relu3->stage2_unit4_bn3 stage2_unit4_conv3 Convolution 1x1/1x1, 512 stage2_unit4_conv3->stage2_unit4_relu3 _plus6 _plus6 _plus6->_plus5 _plus6->stage2_unit4_conv3 stage3_unit1_bn1_gamma stage3_unit1_bn1_gamma stage3_unit1_bn1_beta stage3_unit1_bn1_beta 
stage3_unit1_bn1_moving_mean stage3_unit1_bn1_moving_mean stage3_unit1_bn1_moving_var stage3_unit1_bn1_moving_var stage3_unit1_bn1 stage3_unit1_bn1 stage3_unit1_bn1->_plus6 stage3_unit1_bn1->stage3_unit1_bn1_gamma stage3_unit1_bn1->stage3_unit1_bn1_beta stage3_unit1_bn1->stage3_unit1_bn1_moving_mean stage3_unit1_bn1->stage3_unit1_bn1_moving_var stage3_unit1_relu1 Activation relu stage3_unit1_relu1->stage3_unit1_bn1 stage3_unit1_conv1 Convolution 1x1/1x1, 256 stage3_unit1_conv1->stage3_unit1_relu1 stage3_unit1_bn2_gamma stage3_unit1_bn2_gamma stage3_unit1_bn2_beta stage3_unit1_bn2_beta stage3_unit1_bn2_moving_mean stage3_unit1_bn2_moving_mean stage3_unit1_bn2_moving_var stage3_unit1_bn2_moving_var stage3_unit1_bn2 stage3_unit1_bn2 stage3_unit1_bn2->stage3_unit1_conv1 stage3_unit1_bn2->stage3_unit1_bn2_gamma stage3_unit1_bn2->stage3_unit1_bn2_beta stage3_unit1_bn2->stage3_unit1_bn2_moving_mean stage3_unit1_bn2->stage3_unit1_bn2_moving_var stage3_unit1_relu2 Activation relu stage3_unit1_relu2->stage3_unit1_bn2 stage3_unit1_conv2 Convolution 3x3/2x2, 256 stage3_unit1_conv2->stage3_unit1_relu2 stage3_unit1_bn3_gamma stage3_unit1_bn3_gamma stage3_unit1_bn3_beta stage3_unit1_bn3_beta stage3_unit1_bn3_moving_mean stage3_unit1_bn3_moving_mean stage3_unit1_bn3_moving_var stage3_unit1_bn3_moving_var stage3_unit1_bn3 stage3_unit1_bn3 stage3_unit1_bn3->stage3_unit1_conv2 stage3_unit1_bn3->stage3_unit1_bn3_gamma stage3_unit1_bn3->stage3_unit1_bn3_beta stage3_unit1_bn3->stage3_unit1_bn3_moving_mean stage3_unit1_bn3->stage3_unit1_bn3_moving_var stage3_unit1_relu3 Activation relu stage3_unit1_relu3->stage3_unit1_bn3 stage3_unit1_conv3 Convolution 1x1/1x1, 1024 stage3_unit1_conv3->stage3_unit1_relu3 stage3_unit1_sc Convolution 1x1/2x2, 1024 stage3_unit1_sc->stage3_unit1_relu1 _plus7 _plus7 _plus7->stage3_unit1_conv3 _plus7->stage3_unit1_sc stage3_unit2_bn1_gamma stage3_unit2_bn1_gamma stage3_unit2_bn1_beta stage3_unit2_bn1_beta stage3_unit2_bn1_moving_mean 
stage3_unit2_bn1_moving_mean stage3_unit2_bn1_moving_var stage3_unit2_bn1_moving_var stage3_unit2_bn1 stage3_unit2_bn1 stage3_unit2_bn1->_plus7 stage3_unit2_bn1->stage3_unit2_bn1_gamma stage3_unit2_bn1->stage3_unit2_bn1_beta stage3_unit2_bn1->stage3_unit2_bn1_moving_mean stage3_unit2_bn1->stage3_unit2_bn1_moving_var stage3_unit2_relu1 Activation relu stage3_unit2_relu1->stage3_unit2_bn1 stage3_unit2_conv1 Convolution 1x1/1x1, 256 stage3_unit2_conv1->stage3_unit2_relu1 stage3_unit2_bn2_gamma stage3_unit2_bn2_gamma stage3_unit2_bn2_beta stage3_unit2_bn2_beta stage3_unit2_bn2_moving_mean stage3_unit2_bn2_moving_mean stage3_unit2_bn2_moving_var stage3_unit2_bn2_moving_var stage3_unit2_bn2 stage3_unit2_bn2 stage3_unit2_bn2->stage3_unit2_conv1 stage3_unit2_bn2->stage3_unit2_bn2_gamma stage3_unit2_bn2->stage3_unit2_bn2_beta stage3_unit2_bn2->stage3_unit2_bn2_moving_mean stage3_unit2_bn2->stage3_unit2_bn2_moving_var stage3_unit2_relu2 Activation relu stage3_unit2_relu2->stage3_unit2_bn2 stage3_unit2_conv2 Convolution 3x3/1x1, 256 stage3_unit2_conv2->stage3_unit2_relu2 stage3_unit2_bn3_gamma stage3_unit2_bn3_gamma stage3_unit2_bn3_beta stage3_unit2_bn3_beta stage3_unit2_bn3_moving_mean stage3_unit2_bn3_moving_mean stage3_unit2_bn3_moving_var stage3_unit2_bn3_moving_var stage3_unit2_bn3 stage3_unit2_bn3 stage3_unit2_bn3->stage3_unit2_conv2 stage3_unit2_bn3->stage3_unit2_bn3_gamma stage3_unit2_bn3->stage3_unit2_bn3_beta stage3_unit2_bn3->stage3_unit2_bn3_moving_mean stage3_unit2_bn3->stage3_unit2_bn3_moving_var stage3_unit2_relu3 Activation relu stage3_unit2_relu3->stage3_unit2_bn3 stage3_unit2_conv3 Convolution 1x1/1x1, 1024 stage3_unit2_conv3->stage3_unit2_relu3 _plus8 _plus8 _plus8->_plus7 _plus8->stage3_unit2_conv3 stage3_unit3_bn1_gamma stage3_unit3_bn1_gamma stage3_unit3_bn1_beta stage3_unit3_bn1_beta stage3_unit3_bn1_moving_mean stage3_unit3_bn1_moving_mean stage3_unit3_bn1_moving_var stage3_unit3_bn1_moving_var stage3_unit3_bn1 stage3_unit3_bn1 
stage3_unit3_bn1->_plus8 stage3_unit3_bn1->stage3_unit3_bn1_gamma stage3_unit3_bn1->stage3_unit3_bn1_beta stage3_unit3_bn1->stage3_unit3_bn1_moving_mean stage3_unit3_bn1->stage3_unit3_bn1_moving_var stage3_unit3_relu1 Activation relu stage3_unit3_relu1->stage3_unit3_bn1 stage3_unit3_conv1 Convolution 1x1/1x1, 256 stage3_unit3_conv1->stage3_unit3_relu1 stage3_unit3_bn2_gamma stage3_unit3_bn2_gamma stage3_unit3_bn2_beta stage3_unit3_bn2_beta stage3_unit3_bn2_moving_mean stage3_unit3_bn2_moving_mean stage3_unit3_bn2_moving_var stage3_unit3_bn2_moving_var stage3_unit3_bn2 stage3_unit3_bn2 stage3_unit3_bn2->stage3_unit3_conv1 stage3_unit3_bn2->stage3_unit3_bn2_gamma stage3_unit3_bn2->stage3_unit3_bn2_beta stage3_unit3_bn2->stage3_unit3_bn2_moving_mean stage3_unit3_bn2->stage3_unit3_bn2_moving_var stage3_unit3_relu2 Activation relu stage3_unit3_relu2->stage3_unit3_bn2 stage3_unit3_conv2 Convolution 3x3/1x1, 256 stage3_unit3_conv2->stage3_unit3_relu2 stage3_unit3_bn3_gamma stage3_unit3_bn3_gamma stage3_unit3_bn3_beta stage3_unit3_bn3_beta stage3_unit3_bn3_moving_mean stage3_unit3_bn3_moving_mean stage3_unit3_bn3_moving_var stage3_unit3_bn3_moving_var stage3_unit3_bn3 stage3_unit3_bn3 stage3_unit3_bn3->stage3_unit3_conv2 stage3_unit3_bn3->stage3_unit3_bn3_gamma stage3_unit3_bn3->stage3_unit3_bn3_beta stage3_unit3_bn3->stage3_unit3_bn3_moving_mean stage3_unit3_bn3->stage3_unit3_bn3_moving_var stage3_unit3_relu3 Activation relu stage3_unit3_relu3->stage3_unit3_bn3 stage3_unit3_conv3 Convolution 1x1/1x1, 1024 stage3_unit3_conv3->stage3_unit3_relu3 _plus9 _plus9 _plus9->_plus8 _plus9->stage3_unit3_conv3 stage3_unit4_bn1_gamma stage3_unit4_bn1_gamma stage3_unit4_bn1_beta stage3_unit4_bn1_beta stage3_unit4_bn1_moving_mean stage3_unit4_bn1_moving_mean stage3_unit4_bn1_moving_var stage3_unit4_bn1_moving_var stage3_unit4_bn1 stage3_unit4_bn1 stage3_unit4_bn1->_plus9 stage3_unit4_bn1->stage3_unit4_bn1_gamma stage3_unit4_bn1->stage3_unit4_bn1_beta 
stage3_unit4_bn1->stage3_unit4_bn1_moving_mean stage3_unit4_bn1->stage3_unit4_bn1_moving_var stage3_unit4_relu1 Activation relu stage3_unit4_relu1->stage3_unit4_bn1 stage3_unit4_conv1 Convolution 1x1/1x1, 256 stage3_unit4_conv1->stage3_unit4_relu1 stage3_unit4_bn2_gamma stage3_unit4_bn2_gamma stage3_unit4_bn2_beta stage3_unit4_bn2_beta stage3_unit4_bn2_moving_mean stage3_unit4_bn2_moving_mean stage3_unit4_bn2_moving_var stage3_unit4_bn2_moving_var stage3_unit4_bn2 stage3_unit4_bn2 stage3_unit4_bn2->stage3_unit4_conv1 stage3_unit4_bn2->stage3_unit4_bn2_gamma stage3_unit4_bn2->stage3_unit4_bn2_beta stage3_unit4_bn2->stage3_unit4_bn2_moving_mean stage3_unit4_bn2->stage3_unit4_bn2_moving_var stage3_unit4_relu2 Activation relu stage3_unit4_relu2->stage3_unit4_bn2 stage3_unit4_conv2 Convolution 3x3/1x1, 256 stage3_unit4_conv2->stage3_unit4_relu2 stage3_unit4_bn3_gamma stage3_unit4_bn3_gamma stage3_unit4_bn3_beta stage3_unit4_bn3_beta stage3_unit4_bn3_moving_mean stage3_unit4_bn3_moving_mean stage3_unit4_bn3_moving_var stage3_unit4_bn3_moving_var stage3_unit4_bn3 stage3_unit4_bn3 stage3_unit4_bn3->stage3_unit4_conv2 stage3_unit4_bn3->stage3_unit4_bn3_gamma stage3_unit4_bn3->stage3_unit4_bn3_beta stage3_unit4_bn3->stage3_unit4_bn3_moving_mean stage3_unit4_bn3->stage3_unit4_bn3_moving_var stage3_unit4_relu3 Activation relu stage3_unit4_relu3->stage3_unit4_bn3 stage3_unit4_conv3 Convolution 1x1/1x1, 1024 stage3_unit4_conv3->stage3_unit4_relu3 _plus10 _plus10 _plus10->_plus9 _plus10->stage3_unit4_conv3 stage3_unit5_bn1_gamma stage3_unit5_bn1_gamma stage3_unit5_bn1_beta stage3_unit5_bn1_beta stage3_unit5_bn1_moving_mean stage3_unit5_bn1_moving_mean stage3_unit5_bn1_moving_var stage3_unit5_bn1_moving_var stage3_unit5_bn1 stage3_unit5_bn1 stage3_unit5_bn1->_plus10 stage3_unit5_bn1->stage3_unit5_bn1_gamma stage3_unit5_bn1->stage3_unit5_bn1_beta stage3_unit5_bn1->stage3_unit5_bn1_moving_mean stage3_unit5_bn1->stage3_unit5_bn1_moving_var stage3_unit5_relu1 Activation relu 
stage3_unit5_relu1->stage3_unit5_bn1 stage3_unit5_conv1 Convolution 1x1/1x1, 256 stage3_unit5_conv1->stage3_unit5_relu1 stage3_unit5_bn2_gamma stage3_unit5_bn2_gamma stage3_unit5_bn2_beta stage3_unit5_bn2_beta stage3_unit5_bn2_moving_mean stage3_unit5_bn2_moving_mean stage3_unit5_bn2_moving_var stage3_unit5_bn2_moving_var stage3_unit5_bn2 stage3_unit5_bn2 stage3_unit5_bn2->stage3_unit5_conv1 stage3_unit5_bn2->stage3_unit5_bn2_gamma stage3_unit5_bn2->stage3_unit5_bn2_beta stage3_unit5_bn2->stage3_unit5_bn2_moving_mean stage3_unit5_bn2->stage3_unit5_bn2_moving_var stage3_unit5_relu2 Activation relu stage3_unit5_relu2->stage3_unit5_bn2 stage3_unit5_conv2 Convolution 3x3/1x1, 256 stage3_unit5_conv2->stage3_unit5_relu2 stage3_unit5_bn3_gamma stage3_unit5_bn3_gamma stage3_unit5_bn3_beta stage3_unit5_bn3_beta stage3_unit5_bn3_moving_mean stage3_unit5_bn3_moving_mean stage3_unit5_bn3_moving_var stage3_unit5_bn3_moving_var stage3_unit5_bn3 stage3_unit5_bn3 stage3_unit5_bn3->stage3_unit5_conv2 stage3_unit5_bn3->stage3_unit5_bn3_gamma stage3_unit5_bn3->stage3_unit5_bn3_beta stage3_unit5_bn3->stage3_unit5_bn3_moving_mean stage3_unit5_bn3->stage3_unit5_bn3_moving_var stage3_unit5_relu3 Activation relu stage3_unit5_relu3->stage3_unit5_bn3 stage3_unit5_conv3 Convolution 1x1/1x1, 1024 stage3_unit5_conv3->stage3_unit5_relu3 _plus11 _plus11 _plus11->_plus10 _plus11->stage3_unit5_conv3 stage3_unit6_bn1_gamma stage3_unit6_bn1_gamma stage3_unit6_bn1_beta stage3_unit6_bn1_beta stage3_unit6_bn1_moving_mean stage3_unit6_bn1_moving_mean stage3_unit6_bn1_moving_var stage3_unit6_bn1_moving_var stage3_unit6_bn1 stage3_unit6_bn1 stage3_unit6_bn1->_plus11 stage3_unit6_bn1->stage3_unit6_bn1_gamma stage3_unit6_bn1->stage3_unit6_bn1_beta stage3_unit6_bn1->stage3_unit6_bn1_moving_mean stage3_unit6_bn1->stage3_unit6_bn1_moving_var stage3_unit6_relu1 Activation relu stage3_unit6_relu1->stage3_unit6_bn1 stage3_unit6_conv1 Convolution 1x1/1x1, 256 stage3_unit6_conv1->stage3_unit6_relu1 
stage3_unit6_bn2_gamma stage3_unit6_bn2_gamma stage3_unit6_bn2_beta stage3_unit6_bn2_beta stage3_unit6_bn2_moving_mean stage3_unit6_bn2_moving_mean stage3_unit6_bn2_moving_var stage3_unit6_bn2_moving_var stage3_unit6_bn2 stage3_unit6_bn2 stage3_unit6_bn2->stage3_unit6_conv1 stage3_unit6_bn2->stage3_unit6_bn2_gamma stage3_unit6_bn2->stage3_unit6_bn2_beta stage3_unit6_bn2->stage3_unit6_bn2_moving_mean stage3_unit6_bn2->stage3_unit6_bn2_moving_var stage3_unit6_relu2 Activation relu stage3_unit6_relu2->stage3_unit6_bn2 stage3_unit6_conv2 Convolution 3x3/1x1, 256 stage3_unit6_conv2->stage3_unit6_relu2 stage3_unit6_bn3_gamma stage3_unit6_bn3_gamma stage3_unit6_bn3_beta stage3_unit6_bn3_beta stage3_unit6_bn3_moving_mean stage3_unit6_bn3_moving_mean stage3_unit6_bn3_moving_var stage3_unit6_bn3_moving_var stage3_unit6_bn3 stage3_unit6_bn3 stage3_unit6_bn3->stage3_unit6_conv2 stage3_unit6_bn3->stage3_unit6_bn3_gamma stage3_unit6_bn3->stage3_unit6_bn3_beta stage3_unit6_bn3->stage3_unit6_bn3_moving_mean stage3_unit6_bn3->stage3_unit6_bn3_moving_var stage3_unit6_relu3 Activation relu stage3_unit6_relu3->stage3_unit6_bn3 stage3_unit6_conv3 Convolution 1x1/1x1, 1024 stage3_unit6_conv3->stage3_unit6_relu3 _plus12 _plus12 _plus12->_plus11 _plus12->stage3_unit6_conv3 stage4_unit1_bn1_gamma stage4_unit1_bn1_gamma stage4_unit1_bn1_beta stage4_unit1_bn1_beta stage4_unit1_bn1_moving_mean stage4_unit1_bn1_moving_mean stage4_unit1_bn1_moving_var stage4_unit1_bn1_moving_var stage4_unit1_bn1 stage4_unit1_bn1 stage4_unit1_bn1->_plus12 stage4_unit1_bn1->stage4_unit1_bn1_gamma stage4_unit1_bn1->stage4_unit1_bn1_beta stage4_unit1_bn1->stage4_unit1_bn1_moving_mean stage4_unit1_bn1->stage4_unit1_bn1_moving_var stage4_unit1_relu1 Activation relu stage4_unit1_relu1->stage4_unit1_bn1 stage4_unit1_conv1 Convolution 1x1/1x1, 512 stage4_unit1_conv1->stage4_unit1_relu1 stage4_unit1_bn2_gamma stage4_unit1_bn2_gamma stage4_unit1_bn2_beta stage4_unit1_bn2_beta stage4_unit1_bn2_moving_mean 
stage4_unit1_bn2_moving_mean stage4_unit1_bn2_moving_var stage4_unit1_bn2_moving_var stage4_unit1_bn2 stage4_unit1_bn2 stage4_unit1_bn2->stage4_unit1_conv1 stage4_unit1_bn2->stage4_unit1_bn2_gamma stage4_unit1_bn2->stage4_unit1_bn2_beta stage4_unit1_bn2->stage4_unit1_bn2_moving_mean stage4_unit1_bn2->stage4_unit1_bn2_moving_var stage4_unit1_relu2 Activation relu stage4_unit1_relu2->stage4_unit1_bn2 stage4_unit1_conv2 Convolution 3x3/2x2, 512 stage4_unit1_conv2->stage4_unit1_relu2 stage4_unit1_bn3_gamma stage4_unit1_bn3_gamma stage4_unit1_bn3_beta stage4_unit1_bn3_beta stage4_unit1_bn3_moving_mean stage4_unit1_bn3_moving_mean stage4_unit1_bn3_moving_var stage4_unit1_bn3_moving_var stage4_unit1_bn3 stage4_unit1_bn3 stage4_unit1_bn3->stage4_unit1_conv2 stage4_unit1_bn3->stage4_unit1_bn3_gamma stage4_unit1_bn3->stage4_unit1_bn3_beta stage4_unit1_bn3->stage4_unit1_bn3_moving_mean stage4_unit1_bn3->stage4_unit1_bn3_moving_var stage4_unit1_relu3 Activation relu stage4_unit1_relu3->stage4_unit1_bn3 stage4_unit1_conv3 Convolution 1x1/1x1, 2048 stage4_unit1_conv3->stage4_unit1_relu3 stage4_unit1_sc Convolution 1x1/2x2, 2048 stage4_unit1_sc->stage4_unit1_relu1 _plus13 _plus13 _plus13->stage4_unit1_conv3 _plus13->stage4_unit1_sc stage4_unit2_bn1_gamma stage4_unit2_bn1_gamma stage4_unit2_bn1_beta stage4_unit2_bn1_beta stage4_unit2_bn1_moving_mean stage4_unit2_bn1_moving_mean stage4_unit2_bn1_moving_var stage4_unit2_bn1_moving_var stage4_unit2_bn1 stage4_unit2_bn1 stage4_unit2_bn1->_plus13 stage4_unit2_bn1->stage4_unit2_bn1_gamma stage4_unit2_bn1->stage4_unit2_bn1_beta stage4_unit2_bn1->stage4_unit2_bn1_moving_mean stage4_unit2_bn1->stage4_unit2_bn1_moving_var stage4_unit2_relu1 Activation relu stage4_unit2_relu1->stage4_unit2_bn1 stage4_unit2_conv1 Convolution 1x1/1x1, 512 stage4_unit2_conv1->stage4_unit2_relu1 stage4_unit2_bn2_gamma stage4_unit2_bn2_gamma stage4_unit2_bn2_beta stage4_unit2_bn2_beta stage4_unit2_bn2_moving_mean stage4_unit2_bn2_moving_mean 
stage4_unit2_bn2_moving_var stage4_unit2_bn2_moving_var stage4_unit2_bn2 stage4_unit2_bn2 stage4_unit2_bn2->stage4_unit2_conv1 stage4_unit2_bn2->stage4_unit2_bn2_gamma stage4_unit2_bn2->stage4_unit2_bn2_beta stage4_unit2_bn2->stage4_unit2_bn2_moving_mean stage4_unit2_bn2->stage4_unit2_bn2_moving_var stage4_unit2_relu2 Activation relu stage4_unit2_relu2->stage4_unit2_bn2 stage4_unit2_conv2 Convolution 3x3/1x1, 512 stage4_unit2_conv2->stage4_unit2_relu2 stage4_unit2_bn3_gamma stage4_unit2_bn3_gamma stage4_unit2_bn3_beta stage4_unit2_bn3_beta stage4_unit2_bn3_moving_mean stage4_unit2_bn3_moving_mean stage4_unit2_bn3_moving_var stage4_unit2_bn3_moving_var stage4_unit2_bn3 stage4_unit2_bn3 stage4_unit2_bn3->stage4_unit2_conv2 stage4_unit2_bn3->stage4_unit2_bn3_gamma stage4_unit2_bn3->stage4_unit2_bn3_beta stage4_unit2_bn3->stage4_unit2_bn3_moving_mean stage4_unit2_bn3->stage4_unit2_bn3_moving_var stage4_unit2_relu3 Activation relu stage4_unit2_relu3->stage4_unit2_bn3 stage4_unit2_conv3 Convolution 1x1/1x1, 2048 stage4_unit2_conv3->stage4_unit2_relu3 _plus14 _plus14 _plus14->_plus13 _plus14->stage4_unit2_conv3 stage4_unit3_bn1_gamma stage4_unit3_bn1_gamma stage4_unit3_bn1_beta stage4_unit3_bn1_beta stage4_unit3_bn1_moving_mean stage4_unit3_bn1_moving_mean stage4_unit3_bn1_moving_var stage4_unit3_bn1_moving_var stage4_unit3_bn1 stage4_unit3_bn1 stage4_unit3_bn1->_plus14 stage4_unit3_bn1->stage4_unit3_bn1_gamma stage4_unit3_bn1->stage4_unit3_bn1_beta stage4_unit3_bn1->stage4_unit3_bn1_moving_mean stage4_unit3_bn1->stage4_unit3_bn1_moving_var stage4_unit3_relu1 Activation relu stage4_unit3_relu1->stage4_unit3_bn1 stage4_unit3_conv1 Convolution 1x1/1x1, 512 stage4_unit3_conv1->stage4_unit3_relu1 stage4_unit3_bn2_gamma stage4_unit3_bn2_gamma stage4_unit3_bn2_beta stage4_unit3_bn2_beta stage4_unit3_bn2_moving_mean stage4_unit3_bn2_moving_mean stage4_unit3_bn2_moving_var stage4_unit3_bn2_moving_var stage4_unit3_bn2 stage4_unit3_bn2 stage4_unit3_bn2->stage4_unit3_conv1 
stage4_unit3_bn2->stage4_unit3_bn2_gamma stage4_unit3_bn2->stage4_unit3_bn2_beta stage4_unit3_bn2->stage4_unit3_bn2_moving_mean stage4_unit3_bn2->stage4_unit3_bn2_moving_var stage4_unit3_relu2 Activation relu stage4_unit3_relu2->stage4_unit3_bn2 stage4_unit3_conv2 Convolution 3x3/1x1, 512 stage4_unit3_conv2->stage4_unit3_relu2 stage4_unit3_bn3_gamma stage4_unit3_bn3_gamma stage4_unit3_bn3_beta stage4_unit3_bn3_beta stage4_unit3_bn3_moving_mean stage4_unit3_bn3_moving_mean stage4_unit3_bn3_moving_var stage4_unit3_bn3_moving_var stage4_unit3_bn3 stage4_unit3_bn3 stage4_unit3_bn3->stage4_unit3_conv2 stage4_unit3_bn3->stage4_unit3_bn3_gamma stage4_unit3_bn3->stage4_unit3_bn3_beta stage4_unit3_bn3->stage4_unit3_bn3_moving_mean stage4_unit3_bn3->stage4_unit3_bn3_moving_var stage4_unit3_relu3 Activation relu stage4_unit3_relu3->stage4_unit3_bn3 stage4_unit3_conv3 Convolution 1x1/1x1, 2048 stage4_unit3_conv3->stage4_unit3_relu3 _plus15 _plus15 _plus15->_plus14 _plus15->stage4_unit3_conv3 bn1_gamma bn1_gamma bn1_beta bn1_beta bn1_moving_mean bn1_moving_mean bn1_moving_var bn1_moving_var bn1 bn1 bn1->_plus15 bn1->bn1_gamma bn1->bn1_beta bn1->bn1_moving_mean bn1->bn1_moving_var activation0 Activation relu activation0->bn1 convolution0 Convolution 3x3/1x1, 5 convolution0->activation0 abs0 abs0 abs0->convolution0 _plusscalar0 _plusscalar0 _plusscalar0->abs0 _div0 _div0 _div0->convolution0 _div0->_plusscalar0 logit logit logit->_div0 reshape0 reshape0 reshape0->logit _plusscalar1 _plusscalar1 _plusscalar1->reshape0 _divscalar0 _divscalar0 _divscalar0->_plusscalar1 split1 split1 split1->_divscalar0 softmax_label softmax_label reshape1 reshape1 reshape1->softmax_label split0 split0 split0->reshape1 _mulscalar0->split0 _rminusscalar0 _rminusscalar0 _rminusscalar0->split0 _divscalar1->_rminusscalar0 _mul1 _mul1 _mul1->_plus0 _mul1->split1 _mul0 _mul0 _mul0->_plus0 _mul0->split0 linearregressionoutput0 linearregressionoutput0 linearregressionoutput0->_mul1 
linearregressionoutput0->_mul0 makeloss0 makeloss0 makeloss0->linearregressionoutput0 blockgrad0 blockgrad0 blockgrad0->logit

In [3]:
# Build the record iterators that feed the network.
# Both iterators must agree on image/label geometry, so it is declared once
# instead of being repeated in each constructor call.
IMAGE_SHAPE = (3, 224, 224)  # data_shape handed to ImageRecordIter
# 245 label values per image; presumably a 7x7 grid with 5 values per cell,
# matching the 1x5x7x7 prediction printed further down — TODO confirm against
# the script that packed the .rec files.
LABEL_WIDTH = 7 * 7 * 5
BATCH_SIZE = 1


def make_record_iter(rec_path):
    """Return an ImageRecordIter over ``rec_path`` using the shared geometry.

    Parameters
    ----------
    rec_path : str
        Path to the RecordIO (.rec) file to read.

    Returns
    -------
    mx.io.ImageRecordIter
        Iterator configured with IMAGE_SHAPE, LABEL_WIDTH and BATCH_SIZE.
    """
    return mx.io.ImageRecordIter(path_imgrec=rec_path,
                                 data_shape=IMAGE_SHAPE,
                                 label_width=LABEL_WIDTH,
                                 batch_size=BATCH_SIZE)


train_data = make_record_iter('cat.rec')
# NOTE(review): val_data is not used by any of the cells shown here.
val_data = make_record_iter('cat_small.rec')

In [4]:
# Wrap the symbol in a Module pinned to GPU device 0.
# NOTE(review): the device is hard-coded, so this cell needs a GPU-enabled
# MXNet install; switch to mx.cpu() to run without one.
mod = mx.mod.Module(symbol=sym, context=mx.gpu(0))

In [5]:
# Bind the module using the data and label descriptions advertised by the
# training iterator; this has to happen before init_params / predict below.
mod.bind(train_data.provide_data, train_data.provide_label)

In [6]:
# Seed the module with the checkpoint parameters loaded earlier.
# allow_missing=True lets any parameter that the checkpoint does not provide
# fall back to the Xavier initializer instead of raising.
fallback_initializer = mx.init.Xavier(rnd_type='gaussian',
                                      factor_type='in',
                                      magnitude=2)
mod.init_params(initializer=fallback_initializer,
                arg_params=args_params,
                aux_params=aux_params,
                allow_missing=True)

In [7]:
# Run inference on a single batch drawn from the training iterator and keep
# the network outputs for inspection in the next cell.
out = mod.predict(eval_data=train_data, num_batch=1)

In [9]:
# Show the raw predictions: the recorded output is a list of two NDArrays
# (1x49x1 and 1x5x7x7).
# NOTE(review): the execution counter jumps from 7 to 9 here, so a cell was
# run and removed in between — re-check with Restart Kernel -> Run All.
out


Out[9]:
[<NDArray 1x49x1 @gpu(0)>, <NDArray 1x5x7x7 @gpu(0)>]

In [ ]:



Help on function transpose in module mxnet.symbol:

transpose(*args, **kwargs)
    Permutes the dimensions of an array.
    
    Examples::
    
      x = [[ 1, 2],
           [ 3, 4]]
    
      transpose(x) = [[ 1.,  3.],
                      [ 2.,  4.]]
    
      x = [[[ 1.,  2.],
            [ 3.,  4.]],
    
           [[ 5.,  6.],
            [ 7.,  8.]]]
    
      transpose(x) = [[[ 1.,  5.],
                       [ 3.,  7.]],
    
                      [[ 2.,  6.],
                       [ 4.,  8.]]]
    
      transpose(x, axes=(1,0,2)) = [[[ 1.,  2.],
                                     [ 5.,  6.]],
    
                                    [[ 3.,  4.],
                                     [ 7.,  8.]]]
    
    
    Defined in src/operator/tensor/matrix_op.cc:L168
    
    Parameters
    ----------
    data : Symbol
        Source input
    axes : Shape(tuple), optional, default=()
        Target axis order. By default the axes will be inverted.
    
    name : string, optional.
        Name of the resulting symbol.
    
    Returns
    -------
    Symbol
        The result symbol.