zwt123home123 committed on
Commit
869bf60
·
verified ·
1 Parent(s): 970e45d

Update modeling_llama.py

Browse files
Files changed (1) hide show
  1. modeling_llama.py +1 -1
modeling_llama.py CHANGED
@@ -457,7 +457,7 @@ class LlamaAttention(nn.Module):
457
  if attn_weights.shape[2]>576:
458
  # print("loading ... ")
459
  #print(value_states.shape)
460
- self.ae_v.load_state_dict(torch.load("weights_320/"+"autoencoder_epoch_1_L1_1280_nonorm_layer_"+str(self.layer_idx)+".pth", map_location='cuda'))
461
  value_states_v = value_states[:,:,35:35+576,:]
462
  value_states_v = value_states_v.permute(0, 2, 1, 3)
463
  value_states_v=value_states_v.reshape(value_states_v.shape[0],value_states_v.shape[1],5120)
 
457
  if attn_weights.shape[2]>576:
458
  # print("loading ... ")
459
  #print(value_states.shape)
460
+ self.ae_v.load_state_dict(torch.load("weights_320/"+"autoencoder_epoch_1_L1_nonorm_layer_"+str(self.layer_idx)+".pth", map_location='cuda'))
461
  value_states_v = value_states[:,:,35:35+576,:]
462
  value_states_v = value_states_v.permute(0, 2, 1, 3)
463
  value_states_v=value_states_v.reshape(value_states_v.shape[0],value_states_v.shape[1],5120)