jinaai
/

jina-bert-implementation

Inference Endpoints

Model card | Files and versions | Community

Jackmin801 committed on Oct 13, 2023

Commit

bc43a5e

•

1 Parent(s): df1a7f6

allow math kernel

Files changed (1) hide show

modeling_bert.py +1 -1

modeling_bert.py CHANGED Viewed

@@ -378,7 +378,7 @@ class JinaBertSelfAttention(nn.Module):
             b, _, s, _ = query_layer.shape
             new_bias = attention_mask + bias
             attn = scaled_dot_product_attention(query_layer, key_layer, value_layer, new_bias)
-            attn = attn.permute(0, 2, 1, 3)
             return (attn.view(b, s, self.all_head_size),)
         # Take the dot product between "query" and "key" to get the raw attention scores.

             b, _, s, _ = query_layer.shape
             new_bias = attention_mask + bias
             attn = scaled_dot_product_attention(query_layer, key_layer, value_layer, new_bias)
+            attn = attn.permute(0, 2, 1, 3).contiguous()
             return (attn.view(b, s, self.all_head_size),)
         # Take the dot product between "query" and "key" to get the raw attention scores.