More resnet models (#208)

* add ResNet50 model * add resnet to the models list for testing * fix docctsrings * add Resnet101, Resnet152, and blocks for v2 * add Resnet_v2 models * add tests for resnets
2023-05-24 01:06:51 +05:30 · 2023-05-24 01:06:51 +05:30 · 090112323c
commit 090112323c
parent d5493319b8
3 changed files with 399 additions and 0 deletions
--- a/keras_core/applications/applications_test.py
+++ b/keras_core/applications/applications_test.py
@ -15,6 +15,7 @@ from keras_core.applications import mobilenet_v2
 from keras_core.applications import mobilenet_v3
 from keras_core.applications import nasnet
 from keras_core.applications import resnet
 from keras_core.applications import resnet_v2
 from keras_core.applications import vgg16
 from keras_core.applications import vgg19
 from keras_core.applications import xception
@ -72,6 +73,11 @@ MODEL_LIST = [
    (nasnet.NASNetLarge, 4032, nasnet),
    # resnet
    (resnet.ResNet50, 2048, resnet),
    (resnet.ResNet101, 2048, resnet),
    (resnet.ResNet152, 2048, resnet),
    (resnet_v2.ResNet50V2, 2048, resnet_v2),
    (resnet_v2.ResNet101V2, 2048, resnet_v2),
    (resnet_v2.ResNet152V2, 2048, resnet_v2),
 ]
 # Add names for `named_parameters`.
 MODEL_LIST = [(e[0].__name__, *e) for e in MODEL_LIST]
--- a/keras_core/applications/resnet.py
+++ b/keras_core/applications/resnet.py
@ -16,6 +16,34 @@ WEIGHTS_HASHES = {
        "2cb95161c43110f7111970584f804107",
        "4d473c1dd8becc155b73f8504c6f6626",
    ),
    "resnet101": (
        "f1aeb4b969a6efcfb50fad2f0c20cfc5",
        "88cf7a10940856eca736dc7b7e228a21",
    ),
    "resnet152": (
        "100835be76be38e30d865e96f2aaae62",
        "ee4c566cf9a93f14d82f913c2dc6dd0c",
    ),
    "resnet50v2": (
        "3ef43a0b657b3be2300d5770ece849e0",
        "fac2f116257151a9d068a22e544a4917",
    ),
    "resnet101v2": (
        "6343647c601c52e1368623803854d971",
        "c0ed64b8031c3730f411d2eb4eea35b5",
    ),
    "resnet152v2": (
        "a49b44d1979771252814e80f8ec446f9",
        "ed17cf2e0169df9d443503ef94b23b33",
    ),
    "resnext50": (
        "67a5b30d522ed92f75a1f16eef299d1a",
        "62527c363bdd9ec598bed41947b379fc",
    ),
    "resnext101": (
        "34fb605428fcc7aa4d62f44404c11509",
        "0f678c91647380debd923963594981b3",
    ),
 }
@ -267,6 +295,92 @@ def stack_residual_blocks_v1(x, filters, blocks, stride1=2, name=None):
    return x
 def residual_block_v2(
    x, filters, kernel_size=3, stride=1, conv_shortcut=False, name=None
 ):
    """A residual block for ResNet*_v2.
    Args:
        x: Input tensor.
        filters: No of filters in the bottleneck layer.
        kernel_size: Kernel size of the bottleneck layer. Defaults to 3
        stride: Stride of the first layer. Defaults to 1
        conv_shortcut: Use convolution shortcut if `True`, otherwise
            use identity shortcut. Defaults to `True`
        name(optional): Name of the block
    Returns:
        Output tensor for the residual block.
    """
    if backend.image_data_format() == "channels_last":
        bn_axis = 3
    else:
        bn_axis = 1
    preact = layers.BatchNormalization(
        axis=bn_axis, epsilon=1.001e-5, name=name + "_preact_bn"
    )(x)
    preact = layers.Activation("relu", name=name + "_preact_relu")(preact)
    if conv_shortcut:
        shortcut = layers.Conv2D(
            4 * filters, 1, strides=stride, name=name + "_0_conv"
        )(preact)
    else:
        shortcut = (
            layers.MaxPooling2D(1, strides=stride)(x) if stride > 1 else x
        )
    x = layers.Conv2D(
        filters, 1, strides=1, use_bias=False, name=name + "_1_conv"
    )(preact)
    x = layers.BatchNormalization(
        axis=bn_axis, epsilon=1.001e-5, name=name + "_1_bn"
    )(x)
    x = layers.Activation("relu", name=name + "_1_relu")(x)
    x = layers.ZeroPadding2D(padding=((1, 1), (1, 1)), name=name + "_2_pad")(x)
    x = layers.Conv2D(
        filters,
        kernel_size,
        strides=stride,
        use_bias=False,
        name=name + "_2_conv",
    )(x)
    x = layers.BatchNormalization(
        axis=bn_axis, epsilon=1.001e-5, name=name + "_2_bn"
    )(x)
    x = layers.Activation("relu", name=name + "_2_relu")(x)
    x = layers.Conv2D(4 * filters, 1, name=name + "_3_conv")(x)
    x = layers.Add(name=name + "_out")([shortcut, x])
    return x
 def stack_residual_blocks_v2(x, filters, blocks, stride1=2, name=None):
    """A set of stacked residual blocks.
    Args:
        x: Input tensor.
        filters: Number of filters in the bottleneck layer in a block.
        blocks: Number of blocks in the stacked blocks.
        stride1: Stride of the first layer in the first block. Defaults to 2.
        name: Stack label.
    Returns:
        Output tensor for the stacked blocks.
    """
    x = residual_block_v2(x, filters, conv_shortcut=True, name=name + "_block1")
    for i in range(2, blocks):
        x = residual_block_v2(x, filters, name=name + "_block" + str(i))
    x = residual_block_v2(
        x, filters, stride=stride1, name=name + "_block" + str(blocks)
    )
    return x
@keras_core_export(
    [
        "keras_core.applications.resnet50.ResNet50",
@ -306,6 +420,82 @@ def ResNet50(
    )
@keras_core_export(
    [
        "keras_core.applications.resnet.ResNet101",
        "keras_core.applications.ResNet101",
    ]
 )
 def ResNet101(
    include_top=True,
    weights="imagenet",
    input_tensor=None,
    input_shape=None,
    pooling=None,
    classes=1000,
    classifier_activation="softmax",
 ):
    """Instantiates the ResNet101 architecture."""
    def stack_fn(x):
        x = stack_residual_blocks_v1(x, 64, 3, stride1=1, name="conv2")
        x = stack_residual_blocks_v1(x, 128, 4, name="conv3")
        x = stack_residual_blocks_v1(x, 256, 23, name="conv4")
        return stack_residual_blocks_v1(x, 512, 3, name="conv5")
    return ResNet(
        stack_fn,
        False,
        True,
        "resnet101",
        include_top,
        weights,
        input_tensor,
        input_shape,
        pooling,
        classes,
        classifier_activation=classifier_activation,
    )
@keras_core_export(
    [
        "keras_core.applications.resnet.ResNet152",
        "keras_core.applications.ResNet152",
    ]
 )
 def ResNet152(
    include_top=True,
    weights="imagenet",
    input_tensor=None,
    input_shape=None,
    pooling=None,
    classes=1000,
    classifier_activation="softmax",
 ):
    """Instantiates the ResNet152 architecture."""
    def stack_fn(x):
        x = stack_residual_blocks_v1(x, 64, 3, stride1=1, name="conv2")
        x = stack_residual_blocks_v1(x, 128, 8, name="conv3")
        x = stack_residual_blocks_v1(x, 256, 36, name="conv4")
        return stack_residual_blocks_v1(x, 512, 3, name="conv5")
    return ResNet(
        stack_fn,
        False,
        True,
        "resnet152",
        include_top,
        weights,
        input_tensor,
        input_shape,
        pooling,
        classes,
        classifier_activation=classifier_activation,
    )
@keras_core_export(
    [
        "keras_core.applications.resnet50.preprocess_input",
@ -390,3 +580,5 @@ Returns:
 """
 setattr(ResNet50, "__doc__", ResNet50.__doc__ + DOC)
 setattr(ResNet101, "__doc__", ResNet101.__doc__ + DOC)
 setattr(ResNet152, "__doc__", ResNet152.__doc__ + DOC)
--- a/keras_core/applications/resnet_v2.py
+++ b/keras_core/applications/resnet_v2.py
@ -0,0 +1,201 @@
 from keras_core.api_export import keras_core_export
 from keras_core.applications import imagenet_utils
 from keras_core.applications import resnet
@keras_core_export(
    [
        "keras_core.applications.resnet_v2.ResNet50V2",
        "keras_core.applications.resnet_v2.ResNet50V2",
    ]
 )
 def ResNet50V2(
    include_top=True,
    weights="imagenet",
    input_tensor=None,
    input_shape=None,
    pooling=None,
    classes=1000,
    classifier_activation="softmax",
 ):
    """Instantiates the ResNet50V2 architecture."""
    def stack_fn(x):
        x = resnet.stack_residual_blocks_v2(x, 64, 3, name="conv2")
        x = resnet.stack_residual_blocks_v2(x, 128, 4, name="conv3")
        x = resnet.stack_residual_blocks_v2(x, 256, 6, name="conv4")
        return resnet.stack_residual_blocks_v2(
            x, 512, 3, stride1=1, name="conv5"
        )
    return resnet.ResNet(
        stack_fn,
        True,
        True,
        "resnet50v2",
        include_top,
        weights,
        input_tensor,
        input_shape,
        pooling,
        classes,
        classifier_activation=classifier_activation,
    )
@keras_core_export(
    [
        "keras_core.applications.resnet_v2.ResNet101V2",
        "keras_core.applications.resnet_v2.ResNet101V2",
    ]
 )
 def ResNet101V2(
    include_top=True,
    weights="imagenet",
    input_tensor=None,
    input_shape=None,
    pooling=None,
    classes=1000,
    classifier_activation="softmax",
 ):
    """Instantiates the ResNet101V2 architecture."""
    def stack_fn(x):
        x = resnet.stack_residual_blocks_v2(x, 64, 3, name="conv2")
        x = resnet.stack_residual_blocks_v2(x, 128, 4, name="conv3")
        x = resnet.stack_residual_blocks_v2(x, 256, 23, name="conv4")
        return resnet.stack_residual_blocks_v2(
            x, 512, 3, stride1=1, name="conv5"
        )
    return resnet.ResNet(
        stack_fn,
        True,
        True,
        "resnet101v2",
        include_top,
        weights,
        input_tensor,
        input_shape,
        pooling,
        classes,
        classifier_activation=classifier_activation,
    )
@keras_core_export(
    [
        "keras_core.applications.resnet_v2.ResNet152V2",
        "keras_core.applications.resnet_v2.ResNet152V2",
    ]
 )
 def ResNet152V2(
    include_top=True,
    weights="imagenet",
    input_tensor=None,
    input_shape=None,
    pooling=None,
    classes=1000,
    classifier_activation="softmax",
 ):
    """Instantiates the ResNet152V2 architecture."""
    def stack_fn(x):
        x = resnet.stack_residual_blocks_v2(x, 64, 3, name="conv2")
        x = resnet.stack_residual_blocks_v2(x, 128, 8, name="conv3")
        x = resnet.stack_residual_blocks_v2(x, 256, 36, name="conv4")
        return resnet.stack_residual_blocks_v2(
            x, 512, 3, stride1=1, name="conv5"
        )
    return resnet.ResNet(
        stack_fn,
        True,
        True,
        "resnet152v2",
        include_top,
        weights,
        input_tensor,
        input_shape,
        pooling,
        classes,
        classifier_activation=classifier_activation,
    )
@keras_core_export("keras_core.applications.resnet_v2.preprocess_input")
 def preprocess_input(x, data_format=None):
    return imagenet_utils.preprocess_input(
        x, data_format=data_format, mode="tf"
    )
@keras_core_export("keras_core.applications.resnet_v2.decode_predictions")
 def decode_predictions(preds, top=5):
    return imagenet_utils.decode_predictions(preds, top=top)
 preprocess_input.__doc__ = imagenet_utils.PREPROCESS_INPUT_DOC.format(
    mode="",
    ret=imagenet_utils.PREPROCESS_INPUT_RET_DOC_TF,
    error=imagenet_utils.PREPROCESS_INPUT_ERROR_DOC,
 )
 decode_predictions.__doc__ = imagenet_utils.decode_predictions.__doc__
 DOC = """
 Reference:
 - [Identity Mappings in Deep Residual Networks](
    https://arxiv.org/abs/1603.05027) (CVPR 2016)
 For image classification use cases, see [this page for detailed examples](
    https://keras.io/api/applications/#usage-examples-for-image-classification-models).
 For transfer learning use cases, make sure to read the
 [guide to transfer learning & fine-tuning](
    https://keras.io/guides/transfer_learning/).
 Note: each Keras Application expects a specific kind of input preprocessing.
 For ResNet, call `keras_core.applications.resnet_v2.preprocess_input` on your
 inputs before passing them to the model. `resnet_v2.preprocess_input` will
 scale input pixels between -1 and 1.
 Args:
    include_top: whether to include the fully-connected
        layer at the top of the network.
    weights: one of `None` (random initialization),
        `"imagenet"` (pre-training on ImageNet), or the path to the weights
        file to be loaded.
    input_tensor: optional Keras tensor (i.e. output of `layers.Input()`)
        to use as image input for the model.
    input_shape: optional shape tuple, only to be specified if `include_top`
        is `False` (otherwise the input shape has to be `(224, 224, 3)`
        (with `"channels_last"` data format) or `(3, 224, 224)`
        (with `"channels_first"` data format). It should have exactly 3
        inputs channels, and width and height should be no smaller than 32.
        E.g. `(200, 200, 3)` would be one valid value.
    pooling: Optional pooling mode for feature extraction when `include_top`
        is `False`.
        - `None` means that the output of the model will be the 4D tensor
                output of the last convolutional block.
        - `avg` means that global average pooling will be applied to the output
                of the last convolutional block, and thus the output of the
                model will be a 2D tensor.
        - `max` means that global max pooling will be applied.
    classes: optional number of classes to classify images into, only to be
        specified if `include_top` is `True`, and if no `weights` argument is
        specified.
    classifier_activation: A `str` or callable. The activation function to
        use on the "top" layer. Ignored unless `include_top=True`. Set
        `classifier_activation=None` to return the logits of the "top" layer.
        When loading pretrained weights, `classifier_activation` can only
        be `None` or `"softmax"`.
 Returns:
    A Model instance.
 """
 setattr(ResNet50V2, "__doc__", ResNet50V2.__doc__ + DOC)
 setattr(ResNet101V2, "__doc__", ResNet101V2.__doc__ + DOC)
 setattr(ResNet152V2, "__doc__", ResNet152V2.__doc__ + DOC)