diff --git a/Classification/cnns/README.md b/Classification/cnns/README.md index 3bd7aa2..76b4b68 100644 --- a/Classification/cnns/README.md +++ b/Classification/cnns/README.md @@ -568,8 +568,10 @@ Class: tiger, Panthera tigris; score: 0.8112028241157532 #### 如何生成 ONNX 模型 + **步骤一:指定模型路径** + 首先指定待转换的OneFlow模型路径,然后指定转换后的ONNX模型存放路径,例如示例中: ```python @@ -596,7 +598,47 @@ onnx_model = oneflow_to_onnx(InferenceNet, flow_weights_path, onnx_model_dir, ex 生成 ONNX 模型之后可以使用 ONNX Runtime 运行 ONNX 模型,以验证 OneFlow 模型和 ONNX 模型能够在相同的输入下产生相同的结果。相应的代码在 resnet\_to\_onnx.py 的 `check_equality`。 -#### 训练AlexNet + +## 训练 Res2Net50 +Res2Net源于论文:[Res2Net: A New Multi-scale Backbone Architecture](https://arxiv.org/pdf/1904.01169.pdf),是基于ResNet网络改进的,多尺度的卷积神经网络,其和ResNet主要的不点在于 bottleneck处: + +
+ +
+ +此结构称为Res2Net块,可以将Res2Net块插入经典CNN网络如:ResNet,ResNeXt,BigLittleNet和DLA中以提高准确率。 +训练脚本如下: +```shell +#Please change $DATA_ROOT to your own data root. +python3 of_cnn_train_val.py \ + --train_data_dir=$DATA_ROOT/train \ + --train_data_part_num=256 \ + --val_data_dir=$DATA_ROOT/validation \ + --val_data_part_num=256 \ + --num_nodes=1 \ + --gpu_num_per_node=8 \ + --optimizer="sgd" \ + --momentum=0.875 \ + --lr_decay="cosine" \ + --label_smoothing=0.1 \ + --learning_rate=0.512 \ + --loss_print_every_n_iter=100 \ + --batch_size_per_device=64 \ + --val_batch_size_per_device=50 \ + --use_fp16=True \ + --channel_last=False \ + --fuse_bn_relu=True \ + --fuse_bn_add_relu=True \ + --nccl_fusion_threshold_mb=32 \ + --nccl_fusion_max_ops=48 \ + --gpu_image_decoder=False \ + --num_epoch=100 \ + --model="res2net50" +``` + +我们使用了和ResNet50一致的训练参数,经过93epoch的训练后,Res2Net模型精度达到了:Top1 acc:77.852%,点此下载[模型](https://oneflow-public.oss-cn-beijing.aliyuncs.com/model_zoo/res2net50_of_best_model_val_top1_77852.zip)。 + +## 训练AlexNet ``` #Please change $DATA_ROOT this to your own data root. @@ -622,7 +664,7 @@ python3 of_cnn_train_val.py \ -#### 训练 VGG-16 +## 训练 VGG-16 ``` #Please change $DATA_ROOT this to your own data root. 
python3 cnn_benchmark/of_cnn_train_val.py \ diff --git a/Classification/cnns/data/res2net.jpg b/Classification/cnns/data/res2net.jpg new file mode 100644 index 0000000..e5a815d Binary files /dev/null and b/Classification/cnns/data/res2net.jpg differ diff --git a/Classification/cnns/of_cnn_evaluate.py b/Classification/cnns/of_cnn_evaluate.py index 286f25b..239888b 100644 --- a/Classification/cnns/of_cnn_evaluate.py +++ b/Classification/cnns/of_cnn_evaluate.py @@ -30,6 +30,7 @@ import oneflow as flow import vgg_model import resnet_model +import res2net_model import resnext_model import alexnet_model import mobilenet_v2_model @@ -42,6 +43,7 @@ model_dict = { + "res2net50": res2net_model.res2net50, "resnet50": resnet_model.resnet50, "vgg": vgg_model.vgg16bn, "alexnet": alexnet_model.alexnet, diff --git a/Classification/cnns/of_cnn_train_val.py b/Classification/cnns/of_cnn_train_val.py index ba84865..38bbc96 100755 --- a/Classification/cnns/of_cnn_train_val.py +++ b/Classification/cnns/of_cnn_train_val.py @@ -22,6 +22,7 @@ from util import Snapshot, Summary, InitNodes, Metric from job_function_util import get_train_config, get_val_config import resnet_model +import res2net_model import resnext_model import vgg_model import alexnet_model @@ -42,6 +43,7 @@ model_dict = { "resnet50": resnet_model.resnet50, + "res2net50": res2net_model.res2net50, "vgg": vgg_model.vgg16bn, "alexnet": alexnet_model.alexnet, "inceptionv3": inception_model.inceptionv3, diff --git a/Classification/cnns/res2net_model.py b/Classification/cnns/res2net_model.py new file mode 100644 index 0000000..bd7bc0d --- /dev/null +++ b/Classification/cnns/res2net_model.py @@ -0,0 +1,316 @@ +""" +Copyright 2020 The OneFlow Authors. All rights reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. 
+You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +""" + +import oneflow as flow + + +class Res2netBuilder(object): + def __init__(self, weight_regularizer, trainable=True, training=True, channel_last=False, fuse_bn_relu=True, + fuse_bn_add_relu=True): + self.data_format = "NHWC" if channel_last else "NCHW" + self.weight_initializer = flow.variance_scaling_initializer(2, 'fan_in', 'random_normal', + data_format=self.data_format) + self.weight_regularizer = weight_regularizer + self.trainable = trainable + self.training = training + self.fuse_bn_relu = fuse_bn_relu + self.fuse_bn_add_relu = fuse_bn_add_relu + self.baseWidth = 26 + self.scale = 4 + if self.scale == 1: + self.nums = 1 + else: + self.nums = self.scale - 1 + + + def _conv2d( + self, + name, + input, + filters, + kernel_size, + strides=1, + padding="SAME", + dilations=1, + ): + # There are different shapes of weight metric between 'NCHW' and 'NHWC' mode + if self.data_format == "NHWC": + shape = (filters, kernel_size, kernel_size, input.shape[3]) + else: + shape = (filters, input.shape[1], kernel_size, kernel_size) + weight = flow.get_variable( + name + "-weight", + shape=shape, + dtype=input.dtype, + initializer=self.weight_initializer, + regularizer=self.weight_regularizer, + model_name="weight", + trainable=self.trainable, + ) + + return flow.nn.conv2d(input, weight, strides, padding, self.data_format, dilations, name=name) + + def _batch_norm(self, inputs, name=None, last=False): + initializer = flow.zeros_initializer() if last else flow.ones_initializer() + axis = 1 + if self.data_format == "NHWC": + axis = 3 + return flow.layers.batch_normalization( + 
inputs=inputs, + axis=axis, + momentum=0.9, # 97, + epsilon=1e-5, + center=True, + scale=True, + trainable=self.trainable, + training=self.training, + gamma_initializer=initializer, + moving_variance_initializer=initializer, + gamma_regularizer=self.weight_regularizer, + beta_regularizer=self.weight_regularizer, + name=name, + ) + + def _batch_norm_relu(self, inputs, name=None, last=False): + if self.fuse_bn_relu: + initializer = flow.zeros_initializer() if last else flow.ones_initializer() + axis = 1 + if self.data_format == "NHWC": + axis = 3 + return flow.layers.batch_normalization_relu( + inputs=inputs, + axis=axis, + momentum=0.9, + epsilon=1e-5, + center=True, + scale=True, + trainable=self.trainable, + training=self.training, + gamma_initializer=initializer, + moving_variance_initializer=initializer, + gamma_regularizer=self.weight_regularizer, + beta_regularizer=self.weight_regularizer, + name=name + "_bn_relu", + ) + else: + return flow.nn.relu(self._batch_norm(inputs, name + "_bn", last=last)) + + def _batch_norm_add_relu(self, inputs, addend, name=None, last=False): + if self.fuse_bn_add_relu: + initializer = flow.zeros_initializer() if last else flow.ones_initializer() + axis = 1 + if self.data_format == "NHWC": + axis = 3 + return flow.layers.batch_normalization_add_relu( + inputs=inputs, + addend=addend, + axis=axis, + momentum=0.9, + epsilon=1e-5, + center=True, + scale=True, + trainable=self.trainable, + training=self.training, + gamma_initializer=initializer, + moving_variance_initializer=initializer, + gamma_regularizer=self.weight_regularizer, + beta_regularizer=self.weight_regularizer, + name=name + "_bn_add_relu", + ) + else: + return flow.nn.relu(self._batch_norm(inputs, name + "_bn", last=last) + addend) + + def conv2d_affine(self, input, name, filters, kernel_size, strides): + # input data_format must be NCHW, cannot check now + padding = "SAME" if strides > 1 or kernel_size > 1 else "VALID" + output = self._conv2d(name, input, filters, 
kernel_size, strides, padding)
+        return output
+
+    def bottleneck_res2net(self, input, block_name, filters, filters_inner, stride, stype="normal"):  # Res2Net "bottle2neck" (arXiv:1904.01169)
+        a = self.conv2d_affine(
+            input, block_name + "_branch2a", filters_inner, 1, 1)
+        x = self._batch_norm_relu(a, block_name + "_branch2a")
+
+        spx = []
+        # Split x channel-wise into `scale` equal groups (the multi-scale split).
+        split_num = int(x.shape[1] / self.scale)
+        for i in range(self.scale):
+            split_tensor = flow.slice(x, begin=[None, i * split_num, None, None], size=[None, split_num, None, None])
+            spx.append(split_tensor)
+
+        for i in range(self.nums):
+            if i == 0 or stype == 'stage':
+                sp_tmp = spx[i]
+            else:
+                sp_tmp = sp_tmp + spx[i]
+            sp = self.conv2d_affine(sp_tmp, block_name + "_branch2b_"+str(i), filters, 3, stride if stype == 'stage' else 1)
+            sp = self._batch_norm_relu(sp, block_name + "_branch2b_"+str(i))
+            if i == 0:
+                out = sp
+            else:
+                out = flow.concat(inputs=[out, sp], axis=1)  # accumulate split outputs (was [x, sp]: re-concatenated the whole input each step)
+        if stype == 'normal':
+            out = flow.concat(inputs=[out, spx[self.nums]], axis=1)
+        elif stype == 'stage':
+            # Keep `out` and append the avg-pooled untouched split (previously `out` was discarded here).
+            out = flow.concat(inputs=[out, flow.nn.avg_pool2d(
+                spx[self.nums], ksize=3, strides=stride, padding="SAME",
+                data_format=self.data_format, name=block_name+"bottleneck_avg_pool")], axis=1)
+
+        z = self.conv2d_affine(out, block_name + "_branch2c", filters, 1, 1)
+        return z
+
+
+    def residual_block(self, input, block_name, filters, filters_inner, strides_init):  # one Res2Net residual unit with projection or identity shortcut
+        if strides_init != 1 or block_name == "res2_0":
+            shortcut = self.conv2d_affine(
+                input, block_name + "_branch1", filters, 1, strides_init
+            )
+            shortcut = self._batch_norm(shortcut, block_name + "_branch1_bn")
+            # NOTE(review): downsampling happens inside bottleneck_res2net via strides_init.
+            stype = "stage"
+        else:
+            shortcut = input
+            # Identity shortcut: no projection, no spatial change.
+            stype = "normal"
+
+        bottleneck = self.bottleneck_res2net(
+            input, block_name, filters, filters_inner, strides_init, stype
+        )
+
+        output = self._batch_norm_add_relu(bottleneck, shortcut, block_name + "_branch2c", last=True)
+        return output
+
+
+    def residual_stage(self, input, stage_name, counts, filters, filters_inner, stride_init=2):
+        output = 
input + for i in range(counts): + block_name = "%s_%d" % (stage_name, i) + output = self.residual_block( + output, block_name, filters, filters_inner, stride_init if i == 0 else 1 + ) + return output + + def resnet_conv_x_body(self, input, resnet_blocks): + output = input + for i, (counts, filters, filters_inner) in enumerate(resnet_blocks): + stage_name = "res%d" % (i + 2) + output = self.residual_stage( + output, stage_name, counts, filters, filters_inner, 1 if i == 0 else 2 + ) + + return output + + def resnet_stem(self, input): + conv1 = self._conv2d("conv1", input, 64, 7, 2) + conv1_bn = self._batch_norm_relu(conv1, "conv1") + pool1 = flow.nn.max_pool2d( + conv1_bn, ksize=3, strides=2, padding="SAME", data_format=self.data_format, name="pool1", + ) + return pool1 + + +def res2net50(images, args, trainable=True, training=True): + weight_regularizer = flow.regularizers.l2(args.wd) if args.wd > 0.0 and args.wd < 1.0 else None + builder = Res2netBuilder(weight_regularizer, trainable, training, args.channel_last, args.fuse_bn_relu, + args.fuse_bn_add_relu) + block_counts = [3, 4, 6, 3] + block_filters = [256, 512, 1024, 2048] + block_filters_inner = [64, 128, 256, 512] + resnet_blocks = zip(block_counts, block_filters, block_filters_inner) + + if args.pad_output: + if args.channel_last: + paddings = ((0, 0), (0, 0), (0, 0), (0, 1)) + else: + paddings = ((0, 0), (0, 1), (0, 0), (0, 0)) + images = flow.pad(images, paddings=paddings) + with flow.scope.namespace("Resnet"): + stem = builder.resnet_stem(images) + body = builder.resnet_conv_x_body(stem, resnet_blocks) + pool5 = flow.nn.avg_pool2d( + body, ksize=7, strides=1, padding="VALID", data_format=builder.data_format, name="pool5", + ) + fc1001 = flow.layers.dense( + flow.reshape(pool5, (pool5.shape[0], -1)), + units=1000, + use_bias=True, + kernel_initializer=flow.variance_scaling_initializer(2, 'fan_in', 'random_normal'), + bias_initializer=flow.zeros_initializer(), + kernel_regularizer=weight_regularizer, + 
bias_regularizer=weight_regularizer,
+            trainable=trainable,
+            name="fc1001",
+        )
+    return fc1001
+
+
+def res2net18(images, args, trainable=True, training=True):  # Res2Net-18 variant: same builder, shallower stages
+    weight_regularizer = flow.regularizers.l2(args.wd) if args.wd > 0.0 and args.wd < 1.0 else None
+    builder = Res2netBuilder(weight_regularizer, trainable, training, args.channel_last, args.fuse_bn_relu,
+                             args.fuse_bn_add_relu)
+    block_counts = [2, 2, 2, 2]
+    block_filters = [64, 128, 256, 512]
+    block_filters_inner = [64, 128, 256, 512]
+    resnet_blocks = zip(block_counts, block_filters, block_filters_inner)
+
+    if args.pad_output:
+        if args.channel_last:
+            paddings = ((0, 0), (0, 0), (0, 0), (0, 1))
+        else:
+            paddings = ((0, 0), (0, 1), (0, 0), (0, 0))
+        images = flow.pad(images, paddings=paddings)
+    with flow.scope.namespace("Resnet"):
+        stem = builder.resnet_stem(images)
+        body = builder.resnet_conv_x_body(stem, resnet_blocks)
+        pool5 = flow.nn.avg_pool2d(
+            body, ksize=7, strides=1, padding="VALID", data_format=builder.data_format, name="pool5",
+        )
+        fc1001 = flow.layers.dense(
+            flow.reshape(pool5, (pool5.shape[0], -1)),
+            units=1000,
+            use_bias=True,
+            kernel_initializer=flow.variance_scaling_initializer(2, 'fan_in', 'random_normal'),
+            bias_initializer=flow.zeros_initializer(),
+            kernel_regularizer=weight_regularizer,
+            bias_regularizer=weight_regularizer,
+            trainable=trainable,
+            name="fc1001",
+        )
+    return fc1001
+
+
+import numpy as np
+
+
+def _smoke_test():
+    # One forward pass as a sanity check. Wrapped in a function so importing
+    # this module has no side effects (no CLI parsing, no job registration).
+    import config as configs
+    import oneflow.typing as tp
+    args = configs.get_parser().parse_args()
+
+    @flow.global_function(type="predict")
+    def test_job(images: tp.Numpy.Placeholder((32, 3, 224, 224), dtype=flow.float),
+                 labels: tp.Numpy.Placeholder((32,), dtype=flow.int32)) -> tp.Numpy:
+        return res2net50(images, args)
+
+    images = np.random.uniform(-10, 10, (32, 3, 224, 224)).astype(np.float32)  # 3 channels to match the placeholder (was 1)
+    labels = np.random.randint(-10, 10, (32,)).astype(np.int32)
+    return test_job(images, labels)
+
+if __name__ == '__main__':
+    _smoke_test()