Commit d1770c2

temporary fix: remove dropout from attention layers
1 parent e716ac9 commit d1770c2

2 files changed: 0 additions & 2 deletions

algoperf/workloads/librispeech_conformer/librispeech_jax/models.py

Lines changed: 0 additions & 1 deletion
@@ -428,7 +428,6 @@ def __call__(self, inputs, paddings, train, dropout_rate=DROPOUT_RATE):
         use_bias=True,
         broadcast_dropout=False,
         attention_fn=attention_fn,
-        dropout_rate=dropout_rate,
         deterministic=not train,
     )(inputs_q=inputs, mask=attention_mask)

algoperf/workloads/wmt/wmt_jax/models.py

Lines changed: 0 additions & 1 deletion
@@ -223,7 +223,6 @@ def __call__(self, inputs, encoder_mask=None, dropout_rate=DROPOUT_RATE):
         bias_init=cfg.bias_init,
         use_bias=False,
         broadcast_dropout=False,
-        dropout_rate=dropout_rate,
         deterministic=cfg.deterministic,
     )(cfg.attention_temp * x, x, mask=encoder_mask)
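
Both hunks drop the explicit dropout_rate argument from a Flax nn.MultiHeadDotProductAttention call. Below is a minimal sketch of the effect, assuming only Flax's public API: dropout_rate defaults to 0.0 in Flax, so omitting the argument disables dropout on the attention weights. The num_heads value and tensor shapes are illustrative, not the workloads' actual settings.

import jax
import jax.numpy as jnp
import flax.linen as nn

# Sketch: with dropout_rate omitted, Flax's default of 0.0 applies, so no
# dropout is performed on the attention weights.
attn = nn.MultiHeadDotProductAttention(
    num_heads=4,          # illustrative, not the workload's setting
    use_bias=True,
    broadcast_dropout=False,
    deterministic=True,   # stands in for `not train` in the first hunk
)

x = jnp.ones((2, 16, 32))  # (batch, seq_len, features), illustrative
variables = attn.init(jax.random.PRNGKey(0), inputs_q=x)
out = attn.apply(variables, inputs_q=x)  # keys/values default to inputs_q
print(out.shape)  # (2, 16, 32)

Reinstating the argument would re-enable attention dropout whenever deterministic=False, in which case apply would also need a dropout PRNG stream, e.g. rngs={'dropout': jax.random.PRNGKey(1)}.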
