Spaces:

awsaf49
/

gcvit-tf

Running

App Files Files Community

awsaf49 committed on Feb 2, 2023

Commit

31b7180

•

2 Parent(s): 28f10f6 21fa3d7

Merge branch 'main' of https://huggingface.co/spaces/awsaf49/gcvit-tf into main

Browse files

Files changed (23) hide show

.gitattributes +31 -31
README.md +13 -13
example/Standing_jaguar.jpg +0 -0
gcvit/__pycache__/__init__.cpython-38.pyc +0 -0
gcvit/layers/__init__.py +7 -7
gcvit/layers/__pycache__/__init__.cpython-38.pyc +0 -0
gcvit/layers/__pycache__/attention.cpython-38.pyc +0 -0
gcvit/layers/__pycache__/block.cpython-38.pyc +0 -0
gcvit/layers/__pycache__/drop.cpython-38.pyc +0 -0
gcvit/layers/__pycache__/embedding.cpython-38.pyc +0 -0
gcvit/layers/__pycache__/feature.cpython-38.pyc +0 -0
gcvit/layers/__pycache__/level.cpython-38.pyc +0 -0
gcvit/layers/__pycache__/window.cpython-38.pyc +0 -0
gcvit/layers/block.py +98 -98
gcvit/layers/embedding.py +1 -1
gcvit/layers/feature.py +254 -201
gcvit/layers/level.py +84 -92
gcvit/models/__pycache__/__init__.cpython-38.pyc +0 -0
gcvit/models/__pycache__/gcvit.cpython-38.pyc +0 -0
gcvit/models/gcvit.py +55 -0
gcvit/version.py +1 -1
requirements.txt +4 -4
setup.py +0 -50

.gitattributes CHANGED Viewed

@@ -1,31 +1,31 @@
-*.7z filter=lfs diff=lfs merge=lfs -text
-*.arrow filter=lfs diff=lfs merge=lfs -text
-*.bin filter=lfs diff=lfs merge=lfs -text
-*.bz2 filter=lfs diff=lfs merge=lfs -text
-*.ftz filter=lfs diff=lfs merge=lfs -text
-*.gz filter=lfs diff=lfs merge=lfs -text
-*.h5 filter=lfs diff=lfs merge=lfs -text
-*.joblib filter=lfs diff=lfs merge=lfs -text
-*.lfs.* filter=lfs diff=lfs merge=lfs -text
-*.model filter=lfs diff=lfs merge=lfs -text
-*.msgpack filter=lfs diff=lfs merge=lfs -text
-*.npy filter=lfs diff=lfs merge=lfs -text
-*.npz filter=lfs diff=lfs merge=lfs -text
-*.onnx filter=lfs diff=lfs merge=lfs -text
-*.ot filter=lfs diff=lfs merge=lfs -text
-*.parquet filter=lfs diff=lfs merge=lfs -text
-*.pickle filter=lfs diff=lfs merge=lfs -text
-*.pkl filter=lfs diff=lfs merge=lfs -text
-*.pb filter=lfs diff=lfs merge=lfs -text
-*.pt filter=lfs diff=lfs merge=lfs -text
-*.pth filter=lfs diff=lfs merge=lfs -text
-*.rar filter=lfs diff=lfs merge=lfs -text
-saved_model/**/* filter=lfs diff=lfs merge=lfs -text
-*.tar.* filter=lfs diff=lfs merge=lfs -text
-*.tflite filter=lfs diff=lfs merge=lfs -text
-*.tgz filter=lfs diff=lfs merge=lfs -text
-*.wasm filter=lfs diff=lfs merge=lfs -text
-*.xz filter=lfs diff=lfs merge=lfs -text
-*.zip filter=lfs diff=lfs merge=lfs -text
-*.zstandard filter=lfs diff=lfs merge=lfs -text
-*tfevents* filter=lfs diff=lfs merge=lfs -text

+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zstandard filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -1,13 +1,13 @@
----
-title: Gcvit Tf
-emoji: 📈
-colorFrom: yellow
-colorTo: purple
-sdk: gradio
-sdk_version: 3.1.0
-app_file: app.py
-pinned: false
-license: mit
----
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

+---
+title: Gcvit Tf
+emoji: 📈
+colorFrom: yellow
+colorTo: purple
+sdk: gradio
+sdk_version: 3.1.0
+app_file: app.py
+pinned: false
+license: mit
+---
+Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

example/Standing_jaguar.jpg ADDED Viewed

gcvit/__pycache__/__init__.cpython-38.pyc DELETED Viewed

Binary file (228 Bytes)

gcvit/layers/__init__.py CHANGED Viewed

@@ -1,7 +1,7 @@
-from .window import window_partition, window_reverse
-from .attention import WindowAttention
-from .drop import DropPath, Identity
-from .embedding import PatchEmbed
-from .feature import Mlp, FeatExtract, ReduceSize, SE, Resizing
-from .block import GCViTBlock
-from .level import GCViTLayer

+from .window import window_partition, window_reverse
+from .attention import WindowAttention
+from .drop import DropPath, Identity
+from .embedding import Stem
+from .feature import Mlp, FeatExtract, ReduceSize, SE, Resizing
+from .block import GCViTBlock
+from .level import GCViTLevel

gcvit/layers/__pycache__/__init__.cpython-38.pyc DELETED Viewed

Binary file (530 Bytes)

gcvit/layers/__pycache__/attention.cpython-38.pyc DELETED Viewed

Binary file (3.58 kB)

gcvit/layers/__pycache__/block.cpython-38.pyc DELETED Viewed

Binary file (3 kB)

gcvit/layers/__pycache__/drop.cpython-38.pyc DELETED Viewed

Binary file (1.8 kB)

gcvit/layers/__pycache__/embedding.cpython-38.pyc DELETED Viewed

Binary file (1.39 kB)

gcvit/layers/__pycache__/feature.cpython-38.pyc DELETED Viewed

Binary file (5.5 kB)

gcvit/layers/__pycache__/level.cpython-38.pyc DELETED Viewed

Binary file (3 kB)

gcvit/layers/__pycache__/window.cpython-38.pyc DELETED Viewed

Binary file (801 Bytes)

gcvit/layers/block.py CHANGED Viewed

@@ -1,99 +1,99 @@
-import tensorflow as tf
-from .attention import WindowAttention
-from .drop import DropPath
-from .window import window_partition, window_reverse
-from .feature import Mlp, FeatExtract
-@tf.keras.utils.register_keras_serializable(package="gcvit")
-class GCViTBlock(tf.keras.layers.Layer):
-    def __init__(self, window_size, num_heads, global_query, mlp_ratio=4., qkv_bias=True, qk_scale=None, drop=0.,
-                 attn_drop=0., path_drop=0., act_layer='gelu', layer_scale=None, **kwargs):
-        super().__init__(**kwargs)
-        self.window_size = window_size
-        self.num_heads = num_heads
-        self.global_query = global_query
-        self.mlp_ratio = mlp_ratio
-        self.qkv_bias = qkv_bias
-        self.qk_scale = qk_scale
-        self.drop = drop
-        self.attn_drop = attn_drop
-        self.path_drop = path_drop
-        self.act_layer = act_layer
-        self.layer_scale = layer_scale
-    def build(self, input_shape):
-        B, H, W, C = input_shape[0]
-        self.norm1 = tf.keras.layers.LayerNormalization(axis=-1, epsilon=1e-05, name='norm1')
-        self.attn = WindowAttention(window_size=self.window_size,
-                                   num_heads=self.num_heads,
-                                   global_query=self.global_query,
-                                   qkv_bias=self.qkv_bias,
-                                   qk_scale=self.qk_scale,
-                                   attn_dropout=self.attn_drop,
-                                   proj_dropout=self.drop,
-                                   name='attn')
-        self.drop_path1 = DropPath(self.path_drop)
-        self.drop_path2 = DropPath(self.path_drop)
-        self.norm2 = tf.keras.layers.LayerNormalization(axis=-1, epsilon=1e-05, name='norm2')
-        self.mlp = Mlp(hidden_features=int(C * self.mlp_ratio), dropout=self.drop, act_layer=self.act_layer, name='mlp')
-        if self.layer_scale is not None:
-            self.gamma1 = self.add_weight(
-                'gamma1',
-                shape=[C],
-                initializer=tf.keras.initializers.Constant(self.layer_scale),
-                trainable=True,
-                dtype=self.dtype)
-            self.gamma2 = self.add_weight(
-                'gamma2',
-                shape=[C],
-                initializer=tf.keras.initializers.Constant(self.layer_scale),
-                trainable=True,
-                dtype=self.dtype)
-        else:
-            self.gamma1 = 1.0
-            self.gamma2 = 1.0
-        self.num_windows = int(H // self.window_size) * int(W // self.window_size)
-        super().build(input_shape)
-    def call(self, inputs, **kwargs):
-        if self.global_query:
-            inputs, q_global = inputs
-        else:
-            inputs = inputs[0]
-        B, H, W, C = tf.unstack(tf.shape(inputs), num=4)
-        x = self.norm1(inputs)
-        # create windows and concat them in batch axis
-        x = window_partition(x, self.window_size)  # (B_, win_h, win_w, C)
-        # flatten patch
-        x = tf.reshape(x, shape=[-1, self.window_size * self.window_size, C])  # (B_, N, C) => (batch*num_win, num_token, feature)
-        # attention
-        if self.global_query:
-            x = self.attn([x, q_global])
-        else:
-            x = self.attn([x])
-        # reverse window partition
-        x = window_reverse(x, self.window_size, H, W, C)
-        # FFN
-        x = inputs + self.drop_path1(x * self.gamma1)
-        x = x + self.drop_path2(self.gamma2 * self.mlp(self.norm2(x)))
-        return x
-    def get_config(self):
-        config = super().get_config()
-        config.update({
-            'window_size': self.window_size,
-            'num_heads': self.num_heads,
-            'global_query': self.global_query,
-            'mlp_ratio': self.mlp_ratio,
-            'qkv_bias': self.qkv_bias,
-            'qk_scale': self.qk_scale,
-            'drop': self.drop,
-            'attn_drop': self.attn_drop,
-            'path_drop': self.path_drop,
-            'act_layer': self.act_layer,
-            'layer_scale': self.layer_scale,
-            'num_windows': self.num_windows,
-        })
         return config

+import tensorflow as tf
+from .attention import WindowAttention
+from .drop import DropPath
+from .window import window_partition, window_reverse
+from .feature import Mlp, FeatExtract
+@tf.keras.utils.register_keras_serializable(package="gcvit")
+class GCViTBlock(tf.keras.layers.Layer):
+    def __init__(self, window_size, num_heads, global_query, mlp_ratio=4., qkv_bias=True, qk_scale=None, drop=0.,
+                 attn_drop=0., path_drop=0., act_layer='gelu', layer_scale=None, **kwargs):
+        super().__init__(**kwargs)
+        self.window_size = window_size
+        self.num_heads = num_heads
+        self.global_query = global_query
+        self.mlp_ratio = mlp_ratio
+        self.qkv_bias = qkv_bias
+        self.qk_scale = qk_scale
+        self.drop = drop
+        self.attn_drop = attn_drop
+        self.path_drop = path_drop
+        self.act_layer = act_layer
+        self.layer_scale = layer_scale
+    def build(self, input_shape):
+        B, H, W, C = input_shape[0]
+        self.norm1 = tf.keras.layers.LayerNormalization(axis=-1, epsilon=1e-05, name='norm1')
+        self.attn = WindowAttention(window_size=self.window_size,
+                                   num_heads=self.num_heads,
+                                   global_query=self.global_query,
+                                   qkv_bias=self.qkv_bias,
+                                   qk_scale=self.qk_scale,
+                                   attn_dropout=self.attn_drop,
+                                   proj_dropout=self.drop,
+                                   name='attn')
+        self.drop_path1 = DropPath(self.path_drop)
+        self.drop_path2 = DropPath(self.path_drop)
+        self.norm2 = tf.keras.layers.LayerNormalization(axis=-1, epsilon=1e-05, name='norm2')
+        self.mlp = Mlp(hidden_features=int(C * self.mlp_ratio), dropout=self.drop, act_layer=self.act_layer, name='mlp')
+        if self.layer_scale is not None:
+            self.gamma1 = self.add_weight(
+                'gamma1',
+                shape=[C],
+                initializer=tf.keras.initializers.Constant(self.layer_scale),
+                trainable=True,
+                dtype=self.dtype)
+            self.gamma2 = self.add_weight(
+                'gamma2',
+                shape=[C],
+                initializer=tf.keras.initializers.Constant(self.layer_scale),
+                trainable=True,
+                dtype=self.dtype)
+        else:
+            self.gamma1 = 1.0
+            self.gamma2 = 1.0
+        self.num_windows = int(H // self.window_size) * int(W // self.window_size)
+        super().build(input_shape)
+    def call(self, inputs, **kwargs):
+        if self.global_query:
+            inputs, q_global = inputs
+        else:
+            inputs = inputs[0]
+        B, H, W, C = tf.unstack(tf.shape(inputs), num=4)
+        x = self.norm1(inputs)
+        # create windows and concat them in batch axis
+        x = window_partition(x, self.window_size)  # (B_, win_h, win_w, C)
+        # flatten patch
+        x = tf.reshape(x, shape=[-1, self.window_size * self.window_size, C])  # (B_, N, C) => (batch*num_win, num_token, feature)
+        # attention
+        if self.global_query:
+            x = self.attn([x, q_global])
+        else:
+            x = self.attn([x])
+        # reverse window partition
+        x = window_reverse(x, self.window_size, H, W, C)
+        # FFN
+        x = inputs + self.drop_path1(x * self.gamma1)
+        x = x + self.drop_path2(self.gamma2 * self.mlp(self.norm2(x)))
+        return x
+    def get_config(self):
+        config = super().get_config()
+        config.update({
+            'window_size': self.window_size,
+            'num_heads': self.num_heads,
+            'global_query': self.global_query,
+            'mlp_ratio': self.mlp_ratio,
+            'qkv_bias': self.qkv_bias,
+            'qk_scale': self.qk_scale,
+            'drop': self.drop,
+            'attn_drop': self.attn_drop,
+            'path_drop': self.path_drop,
+            'act_layer': self.act_layer,
+            'layer_scale': self.layer_scale,
+            'num_windows': self.num_windows,
+        })
         return config

gcvit/layers/embedding.py CHANGED Viewed

@@ -4,7 +4,7 @@ from .feature import ReduceSize
 @tf.keras.utils.register_keras_serializable(package="gcvit")
-class PatchEmbed(tf.keras.layers.Layer):
     def __init__(self, dim, **kwargs):
         super().__init__(**kwargs)
         self.dim = dim

 @tf.keras.utils.register_keras_serializable(package="gcvit")
+class Stem(tf.keras.layers.Layer):
     def __init__(self, dim, **kwargs):
         super().__init__(**kwargs)
         self.dim = dim

gcvit/layers/feature.py CHANGED Viewed

@@ -1,202 +1,255 @@
-import tensorflow as tf
-import tensorflow_addons as tfa
-H_AXIS = -3
-W_AXIS = -2
-@tf.keras.utils.register_keras_serializable(package="gcvit")
-class Mlp(tf.keras.layers.Layer):
-    def __init__(self, hidden_features=None, out_features=None, act_layer='gelu', dropout=0., **kwargs):
-        super().__init__(**kwargs)
-        self.hidden_features = hidden_features
-        self.out_features = out_features
-        self.act_layer = act_layer
-        self.dropout = dropout
-    def build(self, input_shape):
-        self.in_features = input_shape[-1]
-        self.hidden_features = self.hidden_features or self.in_features
-        self.out_features = self.out_features or self.in_features
-        self.fc1 = tf.keras.layers.Dense(self.hidden_features, name="fc1")
-        self.act = tf.keras.layers.Activation(self.act_layer, name="act")
-        self.fc2 = tf.keras.layers.Dense(self.out_features, name="fc2")
-        self.drop1 = tf.keras.layers.Dropout(self.dropout, name="drop1")
-        self.drop2 = tf.keras.layers.Dropout(self.dropout, name="drop2")
-        super().build(input_shape)
-    def call(self, inputs, **kwargs):
-        x = self.fc1(inputs)
-        x = self.act(x)
-        x = self.drop1(x)
-        x = self.fc2(x)
-        x = self.drop2(x)
-        return x
-    def get_config(self):
-        config = super().get_config()
-        config.update({
-            "hidden_features":self.hidden_features,
-            "out_features":self.out_features,
-            "act_layer":self.act_layer,
-            "dropout":self.dropout
-            })
-        return config
-@tf.keras.utils.register_keras_serializable(package="gcvit")
-class SE(tf.keras.layers.Layer):
-    def __init__(self, oup=None, expansion=0.25, **kwargs):
-        super().__init__(**kwargs)
-        self.expansion = expansion
-        self.oup = oup
-    def build(self, input_shape):
-        inp = input_shape[-1]
-        self.oup = self.oup or inp
-        self.avg_pool = tfa.layers.AdaptiveAveragePooling2D(1, name="avg_pool")
-        self.fc = [
-            tf.keras.layers.Dense(int(inp * self.expansion), use_bias=False, name='fc/0'),
-            tf.keras.layers.Activation('gelu', name='fc/1'),
-            tf.keras.layers.Dense(self.oup, use_bias=False, name='fc/2'),
-            tf.keras.layers.Activation('sigmoid', name='fc/3')
-            ]
-        super().build(input_shape)
-    def call(self, inputs, **kwargs):
-        b, _, _, c = tf.unstack(tf.shape(inputs), num=4)
-        x = tf.reshape(self.avg_pool(inputs), (b, c))
-        for layer in self.fc:
-            x = layer(x)
-        x = tf.reshape(x, (b, 1, 1, c))
-        return x*inputs
-    def get_config(self):
-        config = super().get_config()
-        config.update({
-            'expansion': self.expansion,
-            'oup': self.oup,
-            })
-        return config
-@tf.keras.utils.register_keras_serializable(package="gcvit")
-class ReduceSize(tf.keras.layers.Layer):
-    def __init__(self, keep_dim=False, **kwargs):
-        super().__init__(**kwargs)
-        self.keep_dim = keep_dim
-    def build(self, input_shape):
-        dim = input_shape[-1]
-        dim_out = dim if self.keep_dim else 2*dim
-        self.pad1 = tf.keras.layers.ZeroPadding2D(1, name='pad1')
-        self.pad2 = tf.keras.layers.ZeroPadding2D(1, name='pad2')
-        self.conv = [
-            tf.keras.layers.DepthwiseConv2D(kernel_size=3, strides=1, padding='valid', use_bias=False, name='conv/0'),
-            tf.keras.layers.Activation('gelu', name='conv/1'),
-            SE(name='conv/2'),
-            tf.keras.layers.Conv2D(dim, kernel_size=1, strides=1, padding='valid', use_bias=False, name='conv/3')
-        ]
-        self.reduction = tf.keras.layers.Conv2D(dim_out, kernel_size=3, strides=2, padding='valid', use_bias=False,
-                                                name='reduction')
-        self.norm1 = tf.keras.layers.LayerNormalization(axis=-1, epsilon=1e-05, name='norm1')  # eps like PyTorch
-        self.norm2 = tf.keras.layers.LayerNormalization(axis=-1, epsilon=1e-05, name='norm2')
-        super().build(input_shape)
-    def call(self, inputs, **kwargs):
-        x = self.norm1(inputs)
-        xr = self.pad1(x)  # if pad had weights it would've thrown error with .save_weights()
-        for layer in self.conv:
-            xr = layer(xr)
-        x = x + xr
-        x = self.pad2(x)
-        x = self.reduction(x)
-        x = self.norm2(x)
-        return x
-    def get_config(self):
-        config = super().get_config()
-        config.update({
-            "keep_dim":self.keep_dim,
-        })
-        return config
-@tf.keras.utils.register_keras_serializable(package="gcvit")
-class FeatExtract(tf.keras.layers.Layer):
-    def __init__(self, keep_dim=False, **kwargs):
-        super().__init__(**kwargs)
-        self.keep_dim = keep_dim
-    def build(self, input_shape):
-        dim = input_shape[-1]
-        self.pad1 = tf.keras.layers.ZeroPadding2D(1, name='pad1')
-        self.pad2 = tf.keras.layers.ZeroPadding2D(1, name='pad2')
-        self.conv = [
-            tf.keras.layers.DepthwiseConv2D(kernel_size=3, strides=1, padding='valid', use_bias=False, name='conv/0'),
-            tf.keras.layers.Activation('gelu', name='conv/1'),
-            SE(name='conv/2'),
-            tf.keras.layers.Conv2D(dim, kernel_size=1, strides=1, padding='valid', use_bias=False, name='conv/3')
-        ]
-        if not self.keep_dim:
-            self.pool = tf.keras.layers.MaxPool2D(pool_size=3, strides=2, padding='valid', name='pool')
-        # else:
-        #     self.pool = tf.keras.layers.Activation('linear', name='identity')  # hack for PyTorch nn.Identity layer ;)
-        super().build(input_shape)
-    def call(self, inputs, **kwargs):
-        x = inputs
-        xr = self.pad1(x)
-        for layer in self.conv:
-            xr = layer(xr)
-        x = x + xr # if pad had weights it would've thrown error with .save_weights()
-        if not self.keep_dim:
-            x = self.pad2(x)
-            x = self.pool(x)
-        return x
-    def get_config(self):
-        config = super().get_config()
-        config.update({
-            "keep_dim":self.keep_dim,
-        })
-        return config
-@tf.keras.utils.register_keras_serializable(package="gcvit")
-class Resizing(tf.keras.layers.Layer):
-    def __init__(self,
-               height,
-               width,
-               interpolation='bilinear',
-               **kwargs):
-        self.height = height
-        self.width = width
-        self.interpolation = interpolation
-        super().__init__(**kwargs)
-    def call(self, inputs):
-        # tf.image.resize will always output float32 and operate more efficiently on
-        # float32 unless interpolation is nearest, in which case output type matches
-        # input type.
-        if self.interpolation == 'nearest':
-            input_dtype = self.compute_dtype
-        else:
-            input_dtype = tf.float32
-        inputs = tf.cast(inputs, dtype=input_dtype)
-        size = [self.height, self.width]
-        outputs = tf.image.resize(
-            inputs,
-            size=size,
-            method=self.interpolation)
-        return tf.cast(outputs, self.compute_dtype)
-    def compute_output_shape(self, input_shape):
-        input_shape = tf.TensorShape(input_shape).as_list()
-        input_shape[H_AXIS] = self.height
-        input_shape[W_AXIS] = self.width
-        return tf.TensorShape(input_shape)
-    def get_config(self):
-        config = super().get_config()
-        config.update({
-            'height': self.height,
-            'width': self.width,
-            'interpolation': self.interpolation,
-            })
         return config

+import tensorflow as tf
+import tensorflow_addons as tfa
+H_AXIS = -3
+W_AXIS = -2
+@tf.keras.utils.register_keras_serializable(package="gcvit")
+class Mlp(tf.keras.layers.Layer):
+    def __init__(self, hidden_features=None, out_features=None, act_layer='gelu', dropout=0., **kwargs):
+        super().__init__(**kwargs)
+        self.hidden_features = hidden_features
+        self.out_features = out_features
+        self.act_layer = act_layer
+        self.dropout = dropout
+    def build(self, input_shape):
+        self.in_features = input_shape[-1]
+        self.hidden_features = self.hidden_features or self.in_features
+        self.out_features = self.out_features or self.in_features
+        self.fc1 = tf.keras.layers.Dense(self.hidden_features, name="fc1")
+        self.act = tf.keras.layers.Activation(self.act_layer, name="act")
+        self.fc2 = tf.keras.layers.Dense(self.out_features, name="fc2")
+        self.drop1 = tf.keras.layers.Dropout(self.dropout, name="drop1")
+        self.drop2 = tf.keras.layers.Dropout(self.dropout, name="drop2")
+        super().build(input_shape)
+    def call(self, inputs, **kwargs):
+        x = self.fc1(inputs)
+        x = self.act(x)
+        x = self.drop1(x)
+        x = self.fc2(x)
+        x = self.drop2(x)
+        return x
+    def get_config(self):
+        config = super().get_config()
+        config.update({
+            "hidden_features":self.hidden_features,
+            "out_features":self.out_features,
+            "act_layer":self.act_layer,
+            "dropout":self.dropout
+            })
+        return config
+@tf.keras.utils.register_keras_serializable(package="gcvit")
+class SE(tf.keras.layers.Layer):
+    def __init__(self, oup=None, expansion=0.25, **kwargs):
+        super().__init__(**kwargs)
+        self.expansion = expansion
+        self.oup = oup
+    def build(self, input_shape):
+        inp = input_shape[-1]
+        self.oup = self.oup or inp
+        self.avg_pool = tfa.layers.AdaptiveAveragePooling2D(1, name="avg_pool")
+        self.fc = [
+            tf.keras.layers.Dense(int(inp * self.expansion), use_bias=False, name='fc/0'),
+            tf.keras.layers.Activation('gelu', name='fc/1'),
+            tf.keras.layers.Dense(self.oup, use_bias=False, name='fc/2'),
+            tf.keras.layers.Activation('sigmoid', name='fc/3')
+            ]
+        super().build(input_shape)
+    def call(self, inputs, **kwargs):
+        b, _, _, c = tf.unstack(tf.shape(inputs), num=4)
+        x = tf.reshape(self.avg_pool(inputs), (b, c))
+        for layer in self.fc:
+            x = layer(x)
+        x = tf.reshape(x, (b, 1, 1, c))
+        return x*inputs
+    def get_config(self):
+        config = super().get_config()
+        config.update({
+            'expansion': self.expansion,
+            'oup': self.oup,
+            })
+        return config
+@tf.keras.utils.register_keras_serializable(package="gcvit")
+class ReduceSize(tf.keras.layers.Layer):
+    def __init__(self, keep_dim=False, **kwargs):
+        super().__init__(**kwargs)
+        self.keep_dim = keep_dim
+    def build(self, input_shape):
+        dim = input_shape[-1]
+        dim_out = dim if self.keep_dim else 2*dim
+        self.pad1 = tf.keras.layers.ZeroPadding2D(1, name='pad1')
+        self.pad2 = tf.keras.layers.ZeroPadding2D(1, name='pad2')
+        self.conv = [
+            tf.keras.layers.DepthwiseConv2D(kernel_size=3, strides=1, padding='valid', use_bias=False, name='conv/0'),
+            tf.keras.layers.Activation('gelu', name='conv/1'),
+            SE(name='conv/2'),
+            tf.keras.layers.Conv2D(dim, kernel_size=1, strides=1, padding='valid', use_bias=False, name='conv/3')
+        ]
+        self.reduction = tf.keras.layers.Conv2D(dim_out, kernel_size=3, strides=2, padding='valid', use_bias=False,
+                                                name='reduction')
+        self.norm1 = tf.keras.layers.LayerNormalization(axis=-1, epsilon=1e-05, name='norm1')  # eps like PyTorch
+        self.norm2 = tf.keras.layers.LayerNormalization(axis=-1, epsilon=1e-05, name='norm2')
+        super().build(input_shape)
+    def call(self, inputs, **kwargs):
+        x = self.norm1(inputs)
+        xr = self.pad1(x)  # if pad had weights it would've thrown error with .save_weights()
+        for layer in self.conv:
+            xr = layer(xr)
+        x = x + xr
+        x = self.pad2(x)
+        x = self.reduction(x)
+        x = self.norm2(x)
+        return x
+    def get_config(self):
+        config = super().get_config()
+        config.update({
+            "keep_dim":self.keep_dim,
+        })
+        return config
+@tf.keras.utils.register_keras_serializable(package="gcvit")
+class FeatExtract(tf.keras.layers.Layer):
+    def __init__(self, keep_dim=False, **kwargs):
+        super().__init__(**kwargs)
+        self.keep_dim = keep_dim
+    def build(self, input_shape):
+        dim = input_shape[-1]
+        self.pad1 = tf.keras.layers.ZeroPadding2D(1, name='pad1')
+        self.pad2 = tf.keras.layers.ZeroPadding2D(1, name='pad2')
+        self.conv = [
+            tf.keras.layers.DepthwiseConv2D(kernel_size=3, strides=1, padding='valid', use_bias=False, name='conv/0'),
+            tf.keras.layers.Activation('gelu', name='conv/1'),
+            SE(name='conv/2'),
+            tf.keras.layers.Conv2D(dim, kernel_size=1, strides=1, padding='valid', use_bias=False, name='conv/3')
+        ]
+        if not self.keep_dim:
+            self.pool = tf.keras.layers.MaxPool2D(pool_size=3, strides=2, padding='valid', name='pool')
+        # else:
+        #     self.pool = tf.keras.layers.Activation('linear', name='identity')  # hack for PyTorch nn.Identity layer ;)
+        super().build(input_shape)
+    def call(self, inputs, **kwargs):
+        x = inputs
+        xr = self.pad1(x)
+        for layer in self.conv:
+            xr = layer(xr)
+        x = x + xr # if pad had weights it would've thrown error with .save_weights()
+        if not self.keep_dim:
+            x = self.pad2(x)
+            x = self.pool(x)
+        return x
+    def get_config(self):
+        config = super().get_config()
+        config.update({
+            "keep_dim":self.keep_dim,
+        })
+        return config
+@tf.keras.utils.register_keras_serializable(package="gcvit")
+class  GlobalQueryGen(tf.keras.layers.Layer):
+    """
+    Global query generator based on: "Hatamizadeh et al.,
+    Global Context Vision Transformers <https://arxiv.org/abs/2206.09959>"
+    """
+    def __init__(self, keep_dims=False, **kwargs):
+        super().__init__(**kwargs)
+        self.keep_dims = keep_dims
+    def build(self, input_shape):
+        self.to_q_global = [FeatExtract(keep_dim, name=f'to_q_global/{i}') \
+                            for i, keep_dim in enumerate(self.keep_dims)]
+        super().build(input_shape)
+    def call(self, inputs, **kwargs):
+        x = inputs
+        for layer in self.to_q_global:
+            x = layer(x)
+        return x
+    def get_config(self):
+        config = super().get_config()
+        config.update({
+            "keep_dims":self.keep_dims,
+        })
+        return config
+@tf.keras.utils.register_keras_serializable(package="gcvit")
+class Resizing(tf.keras.layers.Layer):
+    def __init__(self,
+               height,
+               width,
+               interpolation='bilinear',
+               **kwargs):
+        self.height = height
+        self.width = width
+        self.interpolation = interpolation
+        super().__init__(**kwargs)
+    def call(self, inputs):
+        # tf.image.resize will always output float32 and operate more efficiently on
+        # float32 unless interpolation is nearest, in which case output type matches
+        # input type.
+        if self.interpolation == 'nearest':
+            input_dtype = self.compute_dtype
+        else:
+            input_dtype = tf.float32
+        inputs = tf.cast(inputs, dtype=input_dtype)
+        size = [self.height, self.width]
+        outputs = tf.image.resize(
+            inputs,
+            size=size,
+            method=self.interpolation)
+        return tf.cast(outputs, self.compute_dtype)
+    def compute_output_shape(self, input_shape):
+        input_shape = tf.TensorShape(input_shape).as_list()
+        input_shape[H_AXIS] = self.height
+        input_shape[W_AXIS] = self.width
+        return tf.TensorShape(input_shape)
+    def get_config(self):
+        config = super().get_config()
+        config.update({
+            'height': self.height,
+            'width': self.width,
+            'interpolation': self.interpolation,
+            })
+        return config
+@tf.keras.utils.register_keras_serializable(package="gcvit")
+class FitWindow(tf.keras.layers.Layer):
+    "Pad feature to fit window"
+    def __init__(self, window_size, **kwargs):
+        super().__init__(**kwargs)
+        self.window_size = window_size
+    def call(self, inputs):
+        B, H, W, C = tf.unstack(tf.shape(inputs), num=4)
+        # pad to multiple of window_size
+        h_pad = (self.window_size - H % self.window_size) % self.window_size
+        w_pad = (self.window_size - W % self.window_size) % self.window_size
+        x = tf.pad(inputs, [[0, 0],
+                            [h_pad//2, (h_pad//2 + h_pad%2)],  # padding in both directions unlike tfgcvit
+                            [w_pad//2, (w_pad//2 + w_pad%2)],
+                            [0, 0]])
+        return x
+    def get_config(self):
+        config = super().get_config()
+        config.update({
+            'window_size': self.window_size,
+            })
         return config

gcvit/layers/level.py CHANGED Viewed

@@ -1,93 +1,85 @@
-import tensorflow as tf
-from .feature import FeatExtract, ReduceSize, Resizing
-from .block import GCViTBlock
-@tf.keras.utils.register_keras_serializable(package="gcvit")
-class GCViTLayer(tf.keras.layers.Layer):
-    def __init__(self, depth, num_heads, window_size, keep_dims, downsample=True, mlp_ratio=4., qkv_bias=True,
-                qk_scale=None, drop=0., attn_drop=0., path_drop=0., layer_scale=None, resize_query=False, **kwargs):
-        super().__init__(**kwargs)
-        self.depth = depth
-        self.num_heads = num_heads
-        self.window_size = window_size
-        self.keep_dims = keep_dims
-        self.downsample = downsample
-        self.mlp_ratio = mlp_ratio
-        self.qkv_bias = qkv_bias
-        self.qk_scale = qk_scale
-        self.drop = drop
-        self.attn_drop = attn_drop
-        self.path_drop = path_drop
-        self.layer_scale = layer_scale
-        self.resize_query = resize_query
-    def build(self, input_shape):
-        path_drop = [self.path_drop] * self.depth if not isinstance(self.path_drop, list) else self.path_drop
-        self.blocks = [
-            GCViTBlock(window_size=self.window_size,
-                      num_heads=self.num_heads,
-                      global_query=bool(i % 2),
-                      mlp_ratio=self.mlp_ratio,
-                      qkv_bias=self.qkv_bias,
-                      qk_scale=self.qk_scale,
-                      drop=self.drop,
-                      attn_drop=self.attn_drop,
-                      path_drop=path_drop[i],
-                      layer_scale=self.layer_scale,
-                      name=f'blocks/{i}')
-            for i in range(self.depth)]
-        self.down = ReduceSize(keep_dim=False, name='downsample')
-        self.to_q_global = [
-            FeatExtract(keep_dim, name=f'to_q_global/{i}')
-            for i, keep_dim in enumerate(self.keep_dims)]
-        self.resize = Resizing(self.window_size, self.window_size, interpolation='bicubic')
-        super().build(input_shape)
-    def call(self, inputs, **kwargs):
-        height, width = tf.unstack(tf.shape(inputs)[1:3], num=2)
-        # pad to multiple of window_size
-        h_pad = (self.window_size - height % self.window_size) % self.window_size
-        w_pad = (self.window_size - width % self.window_size) % self.window_size
-        x = tf.pad(inputs, [[0, 0],
-                            [h_pad//2, (h_pad//2 + h_pad%2)],  # padding in both directions unlike tfgcvit
-                            [w_pad//2, (w_pad//2 + w_pad%2)],
-                            [0, 0]])
-        # generate global query
-        q_global = x  # (B, H, W, C)
-        for layer in self.to_q_global:
-            q_global = layer(q_global)  #  official impl issue: https://github.com/NVlabs/GCVit/issues/13
-        # resize query to fit key-value, but result in poor score with official weights?
-        if self.resize_query:
-            q_global = self.resize(q_global)  # to avoid mismatch between feat_map and q_global: https://github.com/NVlabs/GCVit/issues/9
-        # feature_map -> windows -> window_attention -> feature_map
-        for i, blk in enumerate(self.blocks):
-            if i % 2:
-                x = blk([x, q_global])
-            else:
-                x = blk([x])
-        x = x[:, :height, :width, :]  # https://github.com/NVlabs/GCVit/issues/9
-        # set shape for [B, ?, ?, C]
-        x.set_shape(inputs.shape)  # `tf.reshape` creates new tensor with new_shape
-        # downsample
-        if self.downsample:
-          x = self.down(x)
-        return x
-    def get_config(self):
-        config = super().get_config()
-        config.update({
-            'depth': self.depth,
-            'num_heads': self.num_heads,
-            'window_size': self.window_size,
-            'keep_dims': self.keep_dims,
-            'downsample': self.downsample,
-            'mlp_ratio': self.mlp_ratio,
-            'qkv_bias': self.qkv_bias,
-            'qk_scale': self.qk_scale,
-            'drop': self.drop,
-            'attn_drop': self.attn_drop,
-            'path_drop': self.path_drop,
-            'layer_scale': self.layer_scale
-        })
         return config

+import tensorflow as tf
+from .feature import GlobalQueryGen, ReduceSize, Resizing, FitWindow
+from .block import GCViTBlock
+@tf.keras.utils.register_keras_serializable(package="gcvit")
+class GCViTLevel(tf.keras.layers.Layer):
+    def __init__(self, depth, num_heads, window_size, keep_dims, downsample=True, mlp_ratio=4., qkv_bias=True,
+                qk_scale=None, drop=0., attn_drop=0., path_drop=0., layer_scale=None, resize_query=False, **kwargs):
+        super().__init__(**kwargs)
+        self.depth = depth
+        self.num_heads = num_heads
+        self.window_size = window_size
+        self.keep_dims = keep_dims
+        self.downsample = downsample
+        self.mlp_ratio = mlp_ratio
+        self.qkv_bias = qkv_bias
+        self.qk_scale = qk_scale
+        self.drop = drop
+        self.attn_drop = attn_drop
+        self.path_drop = path_drop
+        self.layer_scale = layer_scale
+        self.resize_query = resize_query
+    def build(self, input_shape):
+        path_drop = [self.path_drop] * self.depth if not isinstance(self.path_drop, list) else self.path_drop
+        self.blocks = [
+            GCViTBlock(window_size=self.window_size,
+                      num_heads=self.num_heads,
+                      global_query=bool(i % 2),
+                      mlp_ratio=self.mlp_ratio,
+                      qkv_bias=self.qkv_bias,
+                      qk_scale=self.qk_scale,
+                      drop=self.drop,
+                      attn_drop=self.attn_drop,
+                      path_drop=path_drop[i],
+                      layer_scale=self.layer_scale,
+                      name=f'blocks/{i}')
+            for i in range(self.depth)]
+        self.down = ReduceSize(keep_dim=False, name='downsample')
+        self.q_global_gen = GlobalQueryGen(self.keep_dims, name='q_global_gen')
+        self.resize = Resizing(self.window_size, self.window_size, interpolation='bicubic')
+        self.fit_window = FitWindow(self.window_size)
+        super().build(input_shape)
+    def call(self, inputs, **kwargs):
+        H, W = tf.unstack(tf.shape(inputs)[1:3], num=2)
+        # pad to fit window_size
+        x = self.fit_window(inputs)
+        # generate global query
+        q_global = self.q_global_gen(x) # (B, H, W, C)  # official impl issue: https://github.com/NVlabs/GCVit/issues/13
+        # resize query to fit key-value, but result in poor score with official weights?
+        if self.resize_query:
+            q_global = self.resize(q_global)  # to avoid mismatch between feat_map and q_global: https://github.com/NVlabs/GCVit/issues/9
+        # feature_map -> windows -> window_attention -> feature_map
+        for i, blk in enumerate(self.blocks):
+            if i % 2:
+                x = blk([x, q_global])
+            else:
+                x = blk([x])
+        x = x[:, :H, :W, :]  # https://github.com/NVlabs/GCVit/issues/9
+        # set shape for [B, ?, ?, C]
+        x.set_shape(inputs.shape)  # `tf.reshape` creates new tensor with new_shape
+        # downsample
+        if self.downsample:
+          x = self.down(x)
+        return x
+    def get_config(self):
+        config = super().get_config()
+        config.update({
+            'depth': self.depth,
+            'num_heads': self.num_heads,
+            'window_size': self.window_size,
+            'keep_dims': self.keep_dims,
+            'downsample': self.downsample,
+            'mlp_ratio': self.mlp_ratio,
+            'qkv_bias': self.qkv_bias,
+            'qk_scale': self.qk_scale,
+            'drop': self.drop,
+            'attn_drop': self.attn_drop,
+            'path_drop': self.path_drop,
+            'layer_scale': self.layer_scale
+        })
         return config

gcvit/models/__pycache__/__init__.cpython-38.pyc DELETED Viewed

Binary file (234 Bytes)

gcvit/models/__pycache__/gcvit.cpython-38.pyc DELETED Viewed

Binary file (4.08 kB)

gcvit/models/gcvit.py CHANGED Viewed

@@ -2,11 +2,25 @@ import numpy as np
 import tensorflow as tf
 from ..layers import Stem, GCViTLevel, Identity
 BASE_URL = 'https://github.com/awsaf49/gcvit-tf/releases/download'
 TAG = 'v1.1.1'
 NAME2CONFIG = {
     'gcvit_xxtiny': {'window_size': (7, 7, 14, 7),
                     'dim': 64,
                     'depths': (2, 2, 6, 2),
@@ -24,6 +38,8 @@ NAME2CONFIG = {
                     'depths': (3, 4, 19, 5),
                     'num_heads': (2, 4, 8, 16),
                     'mlp_ratio': 3.,
                     'path_drop': 0.2,},
     'gcvit_small': {'window_size': (7, 7, 14, 7),
                      'dim': 96,
@@ -70,6 +86,7 @@ class GCViT(tf.keras.Model):
         self.num_classes = num_classes
         self.head_act = head_act
         self.patch_embed = Stem(dim=dim, name='patch_embed')
         self.pos_drop = tf.keras.layers.Dropout(drop_rate, name='pos_drop')
         path_drops = np.linspace(0., path_drop, sum(depths))
@@ -77,6 +94,7 @@ class GCViT(tf.keras.Model):
         self.levels = []
         for i in range(len(depths)):
             path_drop = path_drops[sum(depths[:i]):sum(depths[:i + 1])].tolist()
             level = GCViTLevel(depth=depths[i], num_heads=num_heads[i], window_size=window_size[i], keep_dims=keep_dims[i],
                     downsample=(i < len(depths) - 1), mlp_ratio=mlp_ratio, qkv_bias=qkv_bias, qk_scale=qk_scale,
                     drop=drop_rate, attn_drop=attn_drop, path_drop=path_drop, layer_scale=layer_scale, resize_query=resize_query,
@@ -92,13 +110,17 @@ class GCViT(tf.keras.Model):
         else:
             raise ValueError(f'Expecting pooling to be one of None/avg/max. Found: {global_pool}')
         self.head = tf.keras.layers.Dense(num_classes, name='head', activation=head_act)
     def reset_classifier(self, num_classes, head_act, global_pool=None, in_channels=3):
         """Install a new head for `num_classes` outputs and rebuild the model.
         A falsy `num_classes` installs an `Identity` layer instead of a `Dense` head.
         `global_pool` is only stored when it is not None.
         """
         self.num_classes = num_classes
         if global_pool is not None:
             self.global_pool = global_pool
         if num_classes:
             new_head = tf.keras.layers.Dense(num_classes, name='head', activation=head_act)
         else:
             new_head = Identity(name='head')
         self.head = new_head
         super().build((1, 224, 224, in_channels)) # for head we only need info from the input channel
     def forward_features(self, inputs):
         x = self.patch_embed(inputs)
@@ -115,6 +137,7 @@ class GCViT(tf.keras.Model):
             x = self.pool(x)
         if not pre_logits:
             x = self.head(x)
         return x
     def call(self, inputs, **kwargs):
@@ -130,6 +153,9 @@ class GCViT(tf.keras.Model):
     def summary(self, input_shape=(224, 224, 3)):
         """Return the result of `summary()` on the object produced by `build_graph(input_shape)`."""
         graph = self.build_graph(input_shape)
         return graph.summary()
 # load standard models
 def GCViTXXTiny(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
     name = 'gcvit_xxtiny'
@@ -153,28 +179,57 @@ def GCViTXTiny(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **
         model.load_weights(ckpt_path)
     return model
 def GCViTTiny(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
     """Create the `gcvit_tiny` model; with `pretrain=True` also download and load its released weights."""
     name = 'gcvit_tiny'
     settings = NAME2CONFIG[name]
     ckpt_link = '{}/{}/{}_weights.h5'.format(BASE_URL, TAG, name)
     model = GCViT(name=name, resize_query=resize_query, **settings, **kwargs)
     # call the model once on a random single-image batch before any weights are loaded
     dummy_image = tf.random.uniform(shape=input_shape)
     model(dummy_image[tf.newaxis,])
     if not pretrain:
         return model
     ckpt_path = tf.keras.utils.get_file('{}_weights.h5'.format(name), ckpt_link)
     model.load_weights(ckpt_path)
     return model
 def GCViTSmall(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
     """Create the `gcvit_small` model; with `pretrain=True` also download and load its released weights."""
     name = 'gcvit_small'
     settings = NAME2CONFIG[name]
     ckpt_link = '{}/{}/{}_weights.h5'.format(BASE_URL, TAG, name)
     model = GCViT(name=name, resize_query=resize_query, **settings, **kwargs)
     # call the model once on a random single-image batch before any weights are loaded
     dummy_image = tf.random.uniform(shape=input_shape)
     model(dummy_image[tf.newaxis,])
     if not pretrain:
         return model
     ckpt_path = tf.keras.utils.get_file('{}_weights.h5'.format(name), ckpt_link)
     model.load_weights(ckpt_path)
     return model
 def GCViTBase(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
     name = 'gcvit_base'
     config = NAME2CONFIG[name]

 import tensorflow as tf
 from ..layers import Stem, GCViTLevel, Identity
+from ..layers import Stem, GCViTLevel, Identity
 BASE_URL = 'https://github.com/awsaf49/gcvit-tf/releases/download'
 TAG = 'v1.1.1'
 NAME2CONFIG = {
+    'gcvit_xxtiny': {'window_size': (7, 7, 14, 7),
+                    'dim': 64,
+                    'depths': (2, 2, 6, 2),
+                    'num_heads': (2, 4, 8, 16),
+                    'mlp_ratio': 3.,
+                    'path_drop': 0.2},
+    'gcvit_xtiny': {'window_size': (7, 7, 14, 7),
+                    'dim': 64,
+                    'depths': (3, 4, 6, 5),
+                    'num_heads': (2, 4, 8, 16),
+                    'mlp_ratio': 3.,
+                    'path_drop': 0.2},
     'gcvit_xxtiny': {'window_size': (7, 7, 14, 7),
                     'dim': 64,
                     'depths': (2, 2, 6, 2),
                     'depths': (3, 4, 19, 5),
                     'num_heads': (2, 4, 8, 16),
                     'mlp_ratio': 3.,
+                    'num_heads': (2, 4, 8, 16),
+                    'mlp_ratio': 3.,
                     'path_drop': 0.2,},
     'gcvit_small': {'window_size': (7, 7, 14, 7),
                      'dim': 96,
         self.num_classes = num_classes
         self.head_act = head_act
+        self.patch_embed = Stem(dim=dim, name='patch_embed')
         self.patch_embed = Stem(dim=dim, name='patch_embed')
         self.pos_drop = tf.keras.layers.Dropout(drop_rate, name='pos_drop')
         path_drops = np.linspace(0., path_drop, sum(depths))
         self.levels = []
         for i in range(len(depths)):
             path_drop = path_drops[sum(depths[:i]):sum(depths[:i + 1])].tolist()
+            level = GCViTLevel(depth=depths[i], num_heads=num_heads[i], window_size=window_size[i], keep_dims=keep_dims[i],
             level = GCViTLevel(depth=depths[i], num_heads=num_heads[i], window_size=window_size[i], keep_dims=keep_dims[i],
                     downsample=(i < len(depths) - 1), mlp_ratio=mlp_ratio, qkv_bias=qkv_bias, qk_scale=qk_scale,
                     drop=drop_rate, attn_drop=attn_drop, path_drop=path_drop, layer_scale=layer_scale, resize_query=resize_query,
         else:
             raise ValueError(f'Expecting pooling to be one of None/avg/max. Found: {global_pool}')
         self.head = tf.keras.layers.Dense(num_classes, name='head', activation=head_act)
+        self.head = tf.keras.layers.Dense(num_classes, name='head', activation=head_act)
+    def reset_classifier(self, num_classes, head_act, global_pool=None, in_channels=3):
     def reset_classifier(self, num_classes, head_act, global_pool=None, in_channels=3):
         self.num_classes = num_classes
         if global_pool is not None:
             self.global_pool = global_pool
         self.head = tf.keras.layers.Dense(num_classes, name='head', activation=head_act) if num_classes else Identity(name='head')
         super().build((1, 224, 224, in_channels)) # for head we only need info from the input channel
+        self.head = tf.keras.layers.Dense(num_classes, name='head', activation=head_act) if num_classes else Identity(name='head')
+        super().build((1, 224, 224, in_channels)) # for head we only need info from the input channel
     def forward_features(self, inputs):
         x = self.patch_embed(inputs)
             x = self.pool(x)
         if not pre_logits:
             x = self.head(x)
+            x = self.head(x)
         return x
     def call(self, inputs, **kwargs):
     def summary(self, input_shape=(224, 224, 3)):
         return self.build_graph(input_shape).summary()
+    def summary(self, input_shape=(224, 224, 3)):
+        return self.build_graph(input_shape).summary()
 # load standard models
 def GCViTXXTiny(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
     name = 'gcvit_xxtiny'
         model.load_weights(ckpt_path)
     return model
+def GCViTTiny(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
+def GCViTXXTiny(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
+    name = 'gcvit_xxtiny'
+    config = NAME2CONFIG[name]
+    ckpt_link = '{}/{}/{}_weights.h5'.format(BASE_URL, TAG, name)
+    model = GCViT(name=name, resize_query=resize_query, **config,  **kwargs)
+    model(tf.random.uniform(shape=input_shape)[tf.newaxis,])
+    if pretrain:
+        ckpt_path = tf.keras.utils.get_file('{}_weights.h5'.format(name), ckpt_link)
+        model.load_weights(ckpt_path)
+    return model
+def GCViTXTiny(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
+    name = 'gcvit_xtiny'
+    config = NAME2CONFIG[name]
+    ckpt_link = '{}/{}/{}_weights.h5'.format(BASE_URL, TAG, name)
+    model = GCViT(name=name, resize_query=resize_query, **config,  **kwargs)
+    model(tf.random.uniform(shape=input_shape)[tf.newaxis,])
+    if pretrain:
+        ckpt_path = tf.keras.utils.get_file('{}_weights.h5'.format(name), ckpt_link)
+        model.load_weights(ckpt_path)
+    return model
 def GCViTTiny(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
     name = 'gcvit_tiny'
     config = NAME2CONFIG[name]
     ckpt_link = '{}/{}/{}_weights.h5'.format(BASE_URL, TAG, name)
     model = GCViT(name=name, resize_query=resize_query, **config,  **kwargs)
     model(tf.random.uniform(shape=input_shape)[tf.newaxis,])
+    model = GCViT(name=name, resize_query=resize_query, **config,  **kwargs)
+    model(tf.random.uniform(shape=input_shape)[tf.newaxis,])
     if pretrain:
         ckpt_path = tf.keras.utils.get_file('{}_weights.h5'.format(name), ckpt_link)
         model.load_weights(ckpt_path)
     return model
+def GCViTSmall(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
 def GCViTSmall(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
     name = 'gcvit_small'
     config = NAME2CONFIG[name]
     ckpt_link = '{}/{}/{}_weights.h5'.format(BASE_URL, TAG, name)
     model = GCViT(name=name, resize_query=resize_query, **config, **kwargs)
     model(tf.random.uniform(shape=input_shape)[tf.newaxis,])
+    model = GCViT(name=name, resize_query=resize_query, **config, **kwargs)
+    model(tf.random.uniform(shape=input_shape)[tf.newaxis,])
     if pretrain:
         ckpt_path = tf.keras.utils.get_file('{}_weights.h5'.format(name), ckpt_link)
         model.load_weights(ckpt_path)
     return model
+def GCViTBase(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
 def GCViTBase(input_shape=(224, 224, 3), pretrain=False, resize_query=False, **kwargs):
     name = 'gcvit_base'
     config = NAME2CONFIG[name]

gcvit/version.py CHANGED Viewed

	@@ -1 +1 @@
1	- __version__ = "1.0.3"


1	+ __version__ = "1.0.9"

requirements.txt CHANGED Viewed

@@ -1,5 +1,5 @@
-tensorflow==2.4.1
-tensorflow_addons==0.14.0
-gradio==3.1.0
-numpy
 matplotlib

+tensorflow==2.4.1
+tensorflow_addons==0.14.0
+gradio==3.1.0
+numpy
 matplotlib

setup.py DELETED Viewed

@@ -1,50 +0,0 @@
-from setuptools import setup, find_packages
-from codecs import open
-from os import path
-here = path.abspath(path.dirname(__file__))
-# Get the long description from the README file
-with open(path.join(here, "README.md"), encoding="utf-8") as f:
-    long_description = f.read()
-with open(path.join(here, 'requirements.txt')) as f:
-    install_requires = [x for x in f.read().splitlines() if len(x)]
-exec(open("gcvit/version.py").read())
-setup(
-    name="gcvit",
-    version=__version__,
-    description="Tensorflow 2.0 Implementation of GCViT: Global Context Vision Transformer. https://github.com/awsaf49/gcvit-tf",
-    long_description=long_description,
-    long_description_content_type="text/markdown",
-    url="https://github.com/awsaf49/gcvit-tf",
-    author="Awsaf",
-    author_email="awsaf49@gmail.com",
-    classifiers=[
-        # How mature is this project? Common values are
-        #   3 - Alpha
-        #   4 - Beta
-        #   5 - Production/Stable
-        "Development Status :: 3 - Alpha",
-        "Intended Audience :: Developers",
-        "Intended Audience :: Science/Research",
-        "License :: OSI Approved :: Apache Software License",
-        "Programming Language :: Python :: 3.6",
-        "Programming Language :: Python :: 3.7",
-        "Programming Language :: Python :: 3.8",
-        "Topic :: Scientific/Engineering",
-        "Topic :: Scientific/Engineering :: Artificial Intelligence",
-        "Topic :: Software Development",
-        "Topic :: Software Development :: Libraries",
-        "Topic :: Software Development :: Libraries :: Python Modules",
-    ],
-    # Note that this is a string of words separated by whitespace, not a list.
-    keywords="tensorflow computer_vision image classification transformer",
-    packages=find_packages(exclude=["tests"]),
-    include_package_data=True,
-    install_requires=install_requires,
-    python_requires=">=3.6",
-    license="MIT",
-)