import keras_core as keras
from keras_core import backend as K  # keras_core's backend (for get_uid), not standalone keras

# Import the names actually used below instead of a wildcard.
from focalnet_keras_core.layers import FocalModulation, LayerScale, StochasticDepth
def Mlp(hidden_features=None, dropout_rate=0., act_layer=keras.activations.gelu, out_features=None, prefix=None):
    """Feed-forward block: fc1 -> activation -> dropout -> fc2 -> dropout."""
    name = f"{prefix}.mlp" if prefix is not None else "mlp_block"

    def _apply(x):
        nonlocal hidden_features, out_features
        in_features = x.shape[-1]
        out_features = out_features or in_features
        hidden_features = hidden_features or in_features
        x = keras.layers.Dense(hidden_features, activation=act_layer, name=f"{name}.fc1")(x)
        x = keras.layers.Dropout(dropout_rate)(x)
        # The second projection is linear; applying the activation here as well
        # would deviate from the standard transformer MLP block.
        x = keras.layers.Dense(out_features, name=f"{name}.fc2")(x)
        x = keras.layers.Dropout(dropout_rate)(x)
        return x

    return _apply
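# Illustrative usage (a sketch, not part of the original module): the factory
# returns a closure that stacks fc1 -> GELU -> dropout -> fc2 -> dropout on a
# token tensor of shape (batch, tokens, channels).
#
#   inp = keras.Input(shape=(196, 96))
#   out = Mlp(hidden_features=384, dropout_rate=0.1)(inp)  # -> (None, 196, 96)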
def PatchEmbed(img_size=(224, 224), patch_size=4, embed_dim=96, use_conv_embed=False, norm_layer=None, is_stem=False, prefix=None):
    """Patch embedding / downsampling: strided conv, then flatten to tokens.

    `img_size` and the `H`, `W` arguments of `_apply` are kept for call-site
    compatibility with `BasicLayer`.
    """
    name = "patch_embed" if prefix is None else f"{prefix}.downsample"
    patch_size = (patch_size, patch_size)

    def _apply(x, H, W):
        if use_conv_embed:
            # Overlapping convolutional embedding: a larger kernel for the
            # stem, a smaller one for intermediate downsampling stages.
            if is_stem:
                kernel_size, padding, stride = 7, 2, 4
            else:
                kernel_size, padding, stride = 3, 1, 2
            x = keras.layers.ZeroPadding2D(padding=padding)(x)
            x = keras.layers.Conv2D(embed_dim, kernel_size=kernel_size, strides=stride, name=f"{name}.proj")(x)
        else:
            # Non-overlapping patches: kernel and stride both equal patch_size.
            x = keras.layers.Conv2D(embed_dim, kernel_size=patch_size, strides=patch_size, name=f"{name}.proj")(x)
        Ho, Wo, Co = x.shape[1], x.shape[2], x.shape[3]
        x = keras.layers.Reshape((-1, Co))(x)
        if norm_layer is not None:
            x = norm_layer(name=f"{name}.norm")(x)
        return x, Ho, Wo

    return _apply
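# Illustrative usage (a sketch): embed a 224x224 RGB image into a 56x56 token grid.
#
#   inp = keras.Input(shape=(224, 224, 3))
#   tokens, Ho, Wo = PatchEmbed(patch_size=4, embed_dim=96,
#                               norm_layer=keras.layers.LayerNormalization)(inp, 224, 224)
#   # tokens: (None, 3136, 96); Ho == Wo == 56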
def FocalNetBlock(dim, mlp_ratio=4., drop=0., drop_path=0.,
                  act_layer=keras.activations.gelu, norm_layer=keras.layers.LayerNormalization,
                  focal_level=1, focal_window=3,
                  use_layerscale=False, layerscale_value=1e-4,
                  use_postln=False, use_postln_in_modulation=False,
                  normalize_modulator=False, prefix=None, **kwargs):
    """FocalNet block: focal modulation + MLP, each with a residual connection."""
    if prefix is not None:
        name = prefix + ".blocks." + str(K.get_uid(f"{prefix}.blocks.") - 1)
    else:
        name = "focalnet_block"

    def _apply(x, H, W):
        C = x.shape[-1]

        # Focal-modulation branch (pre-norm unless use_postln is set).
        shortcut = x
        if not use_postln:
            x = norm_layer(name=f"{name}.norm1")(x)
        x = keras.layers.Reshape((H, W, C))(x)
        x = FocalModulation(dim, proj_drop=drop, focal_window=focal_window, focal_level=focal_level,
                            use_postln_in_modulation=use_postln_in_modulation,
                            normalize_modulator=normalize_modulator, prefix=name)(x)
        x = keras.layers.Reshape((H * W, C))(x)
        if use_postln:
            x = norm_layer(name=f"{name}.norm1")(x)
        if use_layerscale:
            x = LayerScale(layerscale_value, dim)(x)
        x = StochasticDepth(drop_path)(x)
        x = keras.layers.Add()([shortcut, x])

        # MLP branch; the hidden width must be an integer unit count.
        x = keras.layers.Reshape((H, W, C))(x)
        if use_postln:
            x_alt = Mlp(hidden_features=int(dim * mlp_ratio), dropout_rate=drop,
                        act_layer=act_layer, prefix=name)(x)
            x_alt = norm_layer(name=f"{name}.norm2")(x_alt)
            if use_layerscale:
                x_alt = LayerScale(layerscale_value, dim)(x_alt)
            x_alt = StochasticDepth(drop_path)(x_alt)
            x = keras.layers.Add()([x_alt, x])
        else:
            x_alt = norm_layer(name=f"{name}.norm2")(x)
            x_alt = Mlp(hidden_features=int(dim * mlp_ratio), dropout_rate=drop,
                        act_layer=act_layer, prefix=name)(x_alt)
            x_alt = StochasticDepth(drop_path)(x_alt)
            x = keras.layers.Add()([x_alt, x])
        x = keras.layers.Reshape((H * W, C))(x)
        return x

    return _apply
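# Illustrative usage (a sketch): one block on a 56x56 token grid; the residual
# branches preserve the (tokens, channels) shape.
#
#   inp = keras.Input(shape=(56 * 56, 96))
#   out = FocalNetBlock(dim=96, focal_level=2, focal_window=3)(inp, 56, 56)
#   # out: (None, 3136, 96)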
def BasicLayer(dim, depth, out_dim, input_resolution,
               mlp_ratio=4., drop=0., drop_path=0., norm_layer=keras.layers.LayerNormalization,
               downsample=None,
               focal_level=1, focal_window=1,
               use_conv_embed=False,
               use_layerscale=False, layerscale_value=1e-4,
               use_postln=False,
               use_postln_in_modulation=False,
               normalize_modulator=False, name=None):
    """One FocalNet stage: `depth` blocks followed by optional downsampling."""
    if name is None:
        name = "layers." + str(K.get_uid("layers.") - 1)

    def _apply(x, H, W):
        for i in range(depth):
            x = FocalNetBlock(
                dim=dim,
                mlp_ratio=mlp_ratio,
                drop=drop,
                # Per-block stochastic-depth rate when a schedule is given.
                drop_path=drop_path[i] if isinstance(drop_path, list) else drop_path,
                norm_layer=norm_layer,
                focal_level=focal_level,
                focal_window=focal_window,
                use_layerscale=use_layerscale,
                layerscale_value=layerscale_value,
                use_postln=use_postln,
                use_postln_in_modulation=use_postln_in_modulation,
                normalize_modulator=normalize_modulator,
                prefix=name)(x, H, W)

        if downsample is not None:
            # Merge 2x2 token neighborhoods and expand channels to out_dim.
            C = x.shape[-1]
            x = keras.layers.Reshape((H, W, C))(x)
            x, Ho, Wo = downsample(img_size=input_resolution,
                                   patch_size=2,
                                   embed_dim=out_dim,
                                   use_conv_embed=use_conv_embed,
                                   norm_layer=norm_layer,
                                   is_stem=False,
                                   prefix=name)(x, H, W)
            H, W = Ho, Wo

        return x, H, W

    return _apply
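if __name__ == "__main__":
    # Minimal smoke test, a sketch assuming `focalnet_keras_core.layers`
    # provides FocalModulation, LayerScale, and StochasticDepth as imported
    # above: one stage of two blocks at 96 channels, then a 2x downsample.
    H = W = 56
    inputs = keras.Input(shape=(H * W, 96))
    outputs, Ho, Wo = BasicLayer(dim=96, depth=2, out_dim=192,
                                 input_resolution=(H, W),
                                 downsample=PatchEmbed)(inputs, H, W)
    keras.Model(inputs, outputs).summary()  # tokens 3136 -> 784, channels 96 -> 192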