From b2d99df56eca8a189db74d9a0eb1a93f09141977 Mon Sep 17 00:00:00 2001
From: Sravana Neeli
Date: Mon, 3 Feb 2025 10:25:24 -0800
Subject: [PATCH 1/2] add missing dropout_rate argument to MLP layer

---
 keras_hub/src/models/vit/vit_layers.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/keras_hub/src/models/vit/vit_layers.py b/keras_hub/src/models/vit/vit_layers.py
index f3509440d..c6a8664b0 100644
--- a/keras_hub/src/models/vit/vit_layers.py
+++ b/keras_hub/src/models/vit/vit_layers.py
@@ -257,6 +257,7 @@ def build(self, input_shape):
             hidden_dim=self.hidden_dim,
             mlp_dim=self.mlp_dim,
             use_bias=self.use_mlp_bias,
+            dropout_rate=self.dropout_rate,
             name="mlp",
             dtype=self.dtype_policy,
         )

From eea9da7a249a4b81e3efd198edccfad0e84e3b90 Mon Sep 17 00:00:00 2001
From: Sravana Neeli
Date: Mon, 3 Feb 2025 13:16:44 -0800
Subject: [PATCH 2/2] dropout layer missing as per official implementation

---
 keras_hub/src/models/vit/vit_layers.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/keras_hub/src/models/vit/vit_layers.py b/keras_hub/src/models/vit/vit_layers.py
index c6a8664b0..473cb9cb6 100644
--- a/keras_hub/src/models/vit/vit_layers.py
+++ b/keras_hub/src/models/vit/vit_layers.py
@@ -65,6 +65,7 @@ def build(self, input_shape):
 
     def call(self, inputs):
         x = self.dense_1(inputs)
+        x = self.dropout(x)
         x = self.dense_2(x)
         out = self.dropout(x)
         return out