oceansweep committed on
Commit c96320d
1 Parent(s): cd5e862

Upload Confabulation_check.py

App_Function_Libraries/Confabulation_check.py ADDED
@@ -0,0 +1,81 @@
+ # Confabulation_check.py
+ #
+ # This file contains functions used to check a summary for confabulation against the original transcript.
+ #
+ #
+ # Imports
+ #
+ # External Imports
+ #
+ # Local Imports
+ #
+ #
+ ####################################################################################################
+ #
+ # Functions:
+ from App_Function_Libraries.Chat import chat_api_call
+ from App_Function_Libraries.ms_g_eval import validate_inputs, detailed_api_error
+
+
+ def simplified_geval(transcript: str, summary: str, api_name: str, api_key: str, temp: float = 0.7) -> str:
+     """
+     Perform a simplified version of G-Eval using a single query to evaluate the summary.
+
+     Args:
+         transcript (str): The original transcript
+         summary (str): The summary to be evaluated
+         api_name (str): The name of the LLM API to use
+         api_key (str): The API key for the chosen LLM
+         temp (float, optional): The temperature parameter for the API call. Defaults to 0.7.
+
+     Returns:
+         str: The evaluation result
+     """
+     try:
+         validate_inputs(transcript, summary, api_name, api_key)
+     except ValueError as e:
+         return str(e)
+
+     prompt = f"""You are an AI assistant tasked with evaluating the quality of a summary. You will be given an original transcript and a summary of that transcript. Your task is to evaluate the summary based on the following criteria:
+
+ 1. Coherence (1-5): How well-structured and organized is the summary?
+ 2. Consistency (1-5): How factually aligned is the summary with the original transcript?
+ 3. Fluency (1-3): How well-written is the summary in terms of grammar, spelling, and readability?
+ 4. Relevance (1-5): How well does the summary capture the important information from the transcript?
+
+ Please provide a score for each criterion and a brief explanation for your scoring. Then, give an overall assessment of the summary's quality.
+
+ Original Transcript:
+ {transcript}
+
+ Summary to Evaluate:
+ {summary}
+
+ Please provide your evaluation in the following format:
+ Coherence: [score] - [brief explanation]
+ Consistency: [score] - [brief explanation]
+ Fluency: [score] - [brief explanation]
+ Relevance: [score] - [brief explanation]
+
+ Overall Assessment: [Your overall assessment of the summary's quality]
+ """
+
+     try:
+         result = chat_api_call(
+             api_name,
+             api_key,
+             prompt,
+             "",
+             temp=temp,
+             system_message="You are a helpful AI assistant tasked with evaluating summaries."
+         )
+     except Exception as e:
+         return detailed_api_error(api_name, e)
+
+     formatted_result = f"""
+ Confabulation Check Results:
+
+ {result}
+ """
+
+     return formatted_result
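
For reference, a minimal usage sketch of the new function (not part of the commit). The provider name, API key, and sample text below are placeholders; the accepted api_name values depend on how chat_api_call routes providers in App_Function_Libraries.Chat.

from App_Function_Libraries.Confabulation_check import simplified_geval

transcript = "Speaker A: The budget review is scheduled for 3 PM on Thursday."
summary = "The budget review is scheduled for 3 PM on Friday."

# Placeholder provider and key; substitute whatever chat_api_call actually accepts.
report = simplified_geval(
    transcript=transcript,
    summary=summary,
    api_name="openai",
    api_key="sk-...",
    temp=0.3,  # a lower temperature keeps the scoring more deterministic
)
print(report)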