zetavg commited on
Commit
db1ee85
Β·
1 Parent(s): 469dc51

Fix "operation not supported" error while flagging, and use different log files for different models

Browse files
llama_lora/lib/csv_logger.py ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from gradio import FlaggingCallback, utils
2
+ import csv
3
+ import datetime
4
+ import os
5
+ import re
6
+ import secrets
7
+ from pathlib import Path
8
+ from typing import Any, List
9
+
10
class CSVLogger(FlaggingCallback):
    """
    A FlaggingCallback that logs each flagged sample (both the input and
    output data) to a CSV file with headers on the machine running the
    gradio app.

    Compared with gradio's built-in CSVLogger, ``flag`` accepts a
    ``filename`` argument so different models can log to different files,
    and it falls back to a rewrite-based strategy on filesystems where
    opening a file in append mode raises
    "OSError: [Errno 95] Operation not supported"
    (seen on some cloud-mounted directories).

    Example:
        import gradio as gr
        def image_classifier(inp):
            return {'cat': 0.3, 'dog': 0.7}
        demo = gr.Interface(fn=image_classifier, inputs="image", outputs="label",
                            flagging_callback=CSVLogger())
    Guides: using_flagging
    """

    def __init__(self):
        pass

    def setup(
        self,
        components: List[Any],
        flagging_dir: str | Path,
    ):
        """Remember the components to log and ensure the log dir exists."""
        self.components = components
        self.flagging_dir = flagging_dir
        os.makedirs(flagging_dir, exist_ok=True)

    def flag(
        self,
        flag_data: List[Any],
        flag_option: str = "",
        username: str | None = None,
        filename: str = "log.csv",
    ) -> int:
        """Append one flagged sample to ``filename`` inside the flagging dir.

        Args:
            flag_data: one value per component registered in ``setup``.
            flag_option: the flag label (e.g. "Flag", "Up Vote").
            username: logged as-is, or "" when None.
            filename: target CSV name; unsafe path characters are replaced.

        Returns:
            The number of data rows (header excluded) now in the file.
        """
        flagging_dir = self.flagging_dir
        # Replace characters that are unsafe in file names so the caller
        # may pass arbitrary model names as part of the filename.
        filename = re.sub(r"[/\\?%*:|\"<>\x7F\x00-\x1F]", "-", filename)
        log_filepath = Path(flagging_dir) / filename
        is_new = not Path(log_filepath).exists()
        headers = [
            getattr(component, "label", None) or f"component {idx}"
            for idx, component in enumerate(self.components)
        ] + [
            "flag",
            "username",
            "timestamp",
        ]

        csv_data = []
        for idx, (component, sample) in enumerate(zip(self.components, flag_data)):
            # Components that save artifacts (e.g. images) get their own
            # subdirectory named after the component's label.
            save_dir = Path(
                flagging_dir
            ) / (
                getattr(component, "label", None) or f"component {idx}"
            )
            if utils.is_update(sample):
                csv_data.append(str(sample))
            else:
                csv_data.append(
                    component.deserialize(sample, save_dir=save_dir)
                    if sample is not None
                    else ""
                )
        csv_data.append(flag_option)
        csv_data.append(username if username is not None else "")
        csv_data.append(str(datetime.datetime.now()))

        try:
            with open(log_filepath, "a", newline="", encoding="utf-8") as csvfile:
                writer = csv.writer(csvfile)
                if is_new:
                    writer.writerow(utils.sanitize_list_for_csv(headers))
                writer.writerow(utils.sanitize_list_for_csv(csv_data))
        except OSError:
            # Workaround for "OSError: [Errno 95] Operation not supported"
            # raised by append-mode opens on some cloud-mounted directories:
            # write the new row(s) to a temporary file opened in "w" mode
            # (the previous code opened the tmp file in "a" mode too, which
            # could fail for the same reason), then rebuild the log from
            # scratch. Pure-Python file operations replace the previous
            # os.system() calls, which interpolated file paths into a shell
            # command and were injectable via filenames containing single
            # quotes (the sanitizing regex above strips '"' but not "'").
            random_hex = secrets.token_hex(16)
            tmp_log_filepath = f"{log_filepath}.tmp_{random_hex}"
            with open(tmp_log_filepath, "w", newline="", encoding="utf-8") as csvfile:
                writer = csv.writer(csvfile)
                if is_new:
                    writer.writerow(utils.sanitize_list_for_csv(headers))
                writer.writerow(utils.sanitize_list_for_csv(csv_data))
            old_content = ""
            if not is_new:
                with open(log_filepath, "r", encoding="utf-8") as old_file:
                    old_content = old_file.read()
            with open(tmp_log_filepath, "r", encoding="utf-8") as tmp_file:
                new_content = tmp_file.read()
            # Rewriting the whole file ("w") works where appending ("a")
            # does not, matching the old `cat old tmp > log` behavior.
            with open(log_filepath, "w", newline="", encoding="utf-8") as csvfile:
                csvfile.write(old_content)
                csvfile.write(new_content)
            os.remove(tmp_log_filepath)

        # Count data rows (header excluded) to report back to the caller.
        with open(log_filepath, "r", encoding="utf-8") as csvfile:
            line_count = len([None for row in csv.reader(csvfile)]) - 1
        return line_count
llama_lora/ui/inference_ui.py CHANGED
@@ -10,6 +10,7 @@ from transformers import GenerationConfig
10
  from ..globals import Global
11
  from ..models import get_model, get_tokenizer, get_device
12
  from ..lib.inference import generate
 
13
  from ..utils.data import (
14
  get_available_template_names,
15
  get_available_lora_model_names,
@@ -320,7 +321,7 @@ def inference_ui():
320
  if not os.path.exists(flagging_dir):
321
  os.makedirs(flagging_dir)
322
 
323
- flag_callback = gr.CSVLogger()
324
  flag_components = [
325
  LoggingItem("Base Model"),
326
  LoggingItem("Adaptor Model"),
@@ -366,6 +367,18 @@ def inference_ui():
366
  json.dumps(output_for_flagging.get("generation_config", "")),
367
  ]
368
 
 
 
 
 
 
 
 
 
 
 
 
 
369
  things_that_might_timeout = []
370
 
371
  with gr.Blocks() as inference_ui_blocks:
@@ -510,7 +523,8 @@ def inference_ui():
510
  lambda d: (flag_callback.flag(
511
  get_flag_callback_args(d, "Flag"),
512
  flag_option="Flag",
513
- username=None
 
514
  ), "")[1],
515
  inputs=[output_for_flagging],
516
  outputs=[flag_output],
@@ -519,7 +533,8 @@ def inference_ui():
519
  lambda d: (flag_callback.flag(
520
  get_flag_callback_args(d, "πŸ‘"),
521
  flag_option="Up Vote",
522
- username=None
 
523
  ), "")[1],
524
  inputs=[output_for_flagging],
525
  outputs=[flag_output],
@@ -528,7 +543,8 @@ def inference_ui():
528
  lambda d: (flag_callback.flag(
529
  get_flag_callback_args(d, "πŸ‘Ž"),
530
  flag_option="Down Vote",
531
- username=None
 
532
  ), "")[1],
533
  inputs=[output_for_flagging],
534
  outputs=[flag_output],
 
10
  from ..globals import Global
11
  from ..models import get_model, get_tokenizer, get_device
12
  from ..lib.inference import generate
13
+ from ..lib.csv_logger import CSVLogger
14
  from ..utils.data import (
15
  get_available_template_names,
16
  get_available_lora_model_names,
 
321
  if not os.path.exists(flagging_dir):
322
  os.makedirs(flagging_dir)
323
 
324
+ flag_callback = CSVLogger()
325
  flag_components = [
326
  LoggingItem("Base Model"),
327
  LoggingItem("Adaptor Model"),
 
367
  json.dumps(output_for_flagging.get("generation_config", "")),
368
  ]
369
 
370
def get_flag_filename(output_for_flagging_str):
    # Pick a log file per (base model, adaptor model) pair so flags from
    # different models land in different CSV files.
    parsed = json.loads(output_for_flagging_str)
    base_model = parsed.get("base_model", None)
    adaptor_model = parsed.get("adaptor_model", None)
    # The UI serializes "no adaptor selected" as the literal string "None".
    if adaptor_model == "None":
        adaptor_model = None
    if not base_model:
        return "log.csv"
    suffix = f"#{adaptor_model}" if adaptor_model else ""
    return f"log-{base_model}{suffix}.csv"
381
+
382
  things_that_might_timeout = []
383
 
384
  with gr.Blocks() as inference_ui_blocks:
 
523
  lambda d: (flag_callback.flag(
524
  get_flag_callback_args(d, "Flag"),
525
  flag_option="Flag",
526
+ username=None,
527
+ filename=get_flag_filename(d)
528
  ), "")[1],
529
  inputs=[output_for_flagging],
530
  outputs=[flag_output],
 
533
  lambda d: (flag_callback.flag(
534
  get_flag_callback_args(d, "πŸ‘"),
535
  flag_option="Up Vote",
536
+ username=None,
537
+ filename=get_flag_filename(d)
538
  ), "")[1],
539
  inputs=[output_for_flagging],
540
  outputs=[flag_output],
 
543
  lambda d: (flag_callback.flag(
544
  get_flag_callback_args(d, "πŸ‘Ž"),
545
  flag_option="Down Vote",
546
+ username=None,
547
+ filename=get_flag_filename(d)
548
  ), "")[1],
549
  inputs=[output_for_flagging],
550
  outputs=[flag_output],