ronald committed on
Commit
76cc74c
·
1 Parent(s): abd4226
Files changed (2) hide show
  1. app.py +2 -2
  2. my_perplexity.py +2 -3
app.py CHANGED
@@ -1,6 +1,6 @@
1
  import evaluate
2
  from evaluate.utils import launch_gradio_widget
3
 
4
- # CACHE_DIR="/gfs/team/nlp/users/rcardena/tools/huggingface/evaluate"
5
- module = evaluate.load("my_perplexity", module_type="measurement")#,cache_dir=CACHE_DIR)
6
  launch_gradio_widget(module)
 
1
  import evaluate
2
  from evaluate.utils import launch_gradio_widget
3
 
4
+ CACHE_DIR="/gfs/team/nlp/users/rcardena/tools/huggingface/evaluate"
5
+ module = evaluate.load("my_perplexity", module_type="measurement",cache_dir=CACHE_DIR)
6
  launch_gradio_widget(module)
my_perplexity.py CHANGED
@@ -106,7 +106,6 @@ class MyPerplexity(evaluate.Measurement):
106
 
107
  def _compute(self, predictions, model_id, batch_size: int = 16, add_start_token: bool = True, device=None):
108
 
109
- # CACHE_DIR="/gfs/team/nlp/users/rcardena/tools/huggingface/evaluate"
110
  if device is not None:
111
  assert device in ["gpu", "cpu", "cuda"], "device should be either gpu or cpu."
112
  if device == "gpu":
@@ -114,12 +113,12 @@ class MyPerplexity(evaluate.Measurement):
114
  else:
115
  device = "cuda" if torch.cuda.is_available() else "cpu"
116
 
117
- model = AutoModelForCausalLM.from_pretrained(model_id)#,cache_dir=CACHE_DIR)
118
  model = model.to(device)
119
 
120
  tokenizer = AutoTokenizer.from_pretrained(
121
  model_id,
122
- # cache_dir=CACHE_DIR,
123
  use_fast="cnn_dailymail" not in model_id,
124
  )
125
 
 
106
 
107
  def _compute(self, predictions, model_id, batch_size: int = 16, add_start_token: bool = True, device=None):
108
 
 
109
  if device is not None:
110
  assert device in ["gpu", "cpu", "cuda"], "device should be either gpu or cpu."
111
  if device == "gpu":
 
113
  else:
114
  device = "cuda" if torch.cuda.is_available() else "cpu"
115
 
116
+ model = AutoModelForCausalLM.from_pretrained(model_id,cache_dir=self.cache_dir)
117
  model = model.to(device)
118
 
119
  tokenizer = AutoTokenizer.from_pretrained(
120
  model_id,
121
+ cache_dir=self.cache_dir,
122
  use_fast="cnn_dailymail" not in model_id,
123
  )
124