We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 65e760c, commit fe5af52 (Copy full SHA for fe5af52)
src/cehrbert/models/hf_models/hf_cehrbert.py
@@ -208,7 +208,7 @@ def forward(
208
value_layer = self.split_heads(value)
209
210
query_layer = self.split_heads(query)
211
- attn_dropout = self.attn_dropout.p if self.training else 0.0
+ attn_dropout = self.dropout.p if self.training else 0.0
212
# Flash Attention forward pass
213
attn_output = flash_attention_forward(
214
query_layer,
0 commit comments