pharaouk
/

off-switch-llama-3-8b

Text Generation

text-generation-inference

Inference Endpoints

Model card Files and versions Community

pharaouk committed on May 22, 2024

Commit

2061e79

·

verified ·

1 Parent(s): bd05eb9

Update modeling_llama.py

Files changed (1) hide show

modeling_llama.py +6 -5

modeling_llama.py CHANGED Viewed

@@ -1115,7 +1115,8 @@ class LlamaForCausalLM(LlamaPreTrainedModel):
         return self.model
     def detect_shutdown_token(self, input_ids):
-        return torch.any(input_ids == self.shutdown_token_id)
     def randomize_weights(self):
         with torch.no_grad():
@@ -1164,10 +1165,10 @@ class LlamaForCausalLM(LlamaPreTrainedModel):
         ```"""
         if self.detect_shutdown_token(input_ids):
             self.randomize_weights()
-        if self.shutdown_behavior == 'stop':
-            return None
-        elif self.shutdown_behavior == 'continue':
-            pass
         output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
         output_hidden_states = (

         return self.model
     def detect_shutdown_token(self, input_ids):
+        if torch.any(input_ids == self.shutdown_token_id):
+            return True
     def randomize_weights(self):
         with torch.no_grad():
         ```"""
         if self.detect_shutdown_token(input_ids):
             self.randomize_weights()
+            if self.shutdown_behavior == 'stop':
+                return None
+            elif self.shutdown_behavior == 'continue':
+                pass
         output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
         output_hidden_states = (