magicslabnu
/

clip_softmax_opt125m

Text Generation

text-generation-inference

Inference Endpoints

Model card · Files and versions · Community

robinzixuan committed on Jun 15, 2024

Commit

4776224

·

verified ·

1 Parent(s): 3fe86b3

Upload modeling_opt.py

Files changed (1) hide show

modeling_opt.py +4 -4

modeling_opt.py CHANGED Viewed

@@ -201,10 +201,10 @@ class OPTAttention(nn.Module):
         self.scaling = self.head_dim**-0.5
         self.is_decoder = is_decoder
-        self.k_proj = nn.Linear(embed_dim, embed_dim, bias=bias)
-        self.v_proj = nn.Linear(embed_dim, embed_dim, bias=bias)
-        self.q_proj = nn.Linear(embed_dim, embed_dim, bias=bias)
-        self.out_proj = nn.Linear(embed_dim, embed_dim, bias=bias)
         # YB: capture the input and output of the softmax
         self.attn_scores = nn.Identity()  # before attention mask

         self.scaling = self.head_dim**-0.5
         self.is_decoder = is_decoder
+        self.k_proj = nn.Linear(self.embed_dim, self.embed_dim, bias=bias)
+        self.v_proj = nn.Linear(self.embed_dim, self.embed_dim, bias=bias)
+        self.q_proj = nn.Linear(self.embed_dim, self.embed_dim, bias=bias)
+        self.out_proj = nn.Linear(self.embed_dim, self.embed_dim, bias=bias)
         # YB: capture the input and output of the softmax
         self.attn_scores = nn.Identity()  # before attention mask