Spaces:

karthi311
/

medical_soap

Runtime error

App Files Files Community

karthi311 committed on Dec 10, 2024

Commit

4d605d9

verified ·

1 Parent(s): 6c2aa57

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -32

app.py CHANGED Viewed

@@ -1,12 +1,11 @@
 import torch
 import gradio as gr
-from transformers import AutoProcessor, AutoModelForImageTextToText, pipeline,AutoTokenizer, AutoModelForSeq2SeqLM
 from pydub import AudioSegment
 from sentence_transformers import SentenceTransformer, util
 import spacy
-spacy.cli.download("en_core_web_sm")
 import json
-from faster_whisper import WhisperModel
 # Audio conversion from MP4 to MP3
 def convert_mp4_to_mp3(mp4_path, mp3_path):
@@ -16,7 +15,6 @@ def convert_mp4_to_mp3(mp4_path, mp3_path):
     except Exception as e:
         raise RuntimeError(f"Error converting MP4 to MP3: {e}")
 # Check if CUDA is available for GPU acceleration
 if torch.cuda.is_available():
     device = "cuda"
@@ -25,13 +23,11 @@ else:
     device = "cpu"
     compute_type = "int8"
 # Load Faster Whisper Model for transcription
 def load_faster_whisper():
     """Build and return the Faster Whisper model used for transcription.
     The model is created with the module-level ``device`` and
     ``compute_type`` settings.
     """
     return WhisperModel(
         "deepdml/faster-whisper-large-v3-turbo-ct2",
         device=device,
         compute_type=compute_type,
     )
 # Load NLP model and other helpers
 nlp = spacy.load("en_core_web_sm")
 embedder = SentenceTransformer("all-MiniLM-L6-v2")
@@ -41,7 +37,6 @@ model = AutoModelForSeq2SeqLM.from_pretrained("Mahalingam/DistilBart-Med-Summary
 summarizer = pipeline("summarization", model=model, tokenizer=tokenizer)
 soap_prompts = {
     "subjective": "Personal reports, symptoms described by patients, or personal health concerns. Details reflecting individual symptoms or health descriptions.",
     "objective": "Observable facts, clinical findings, professional observations, specific medical specialties, and diagnoses.",
@@ -50,23 +45,15 @@ soap_prompts = {
 }
 soap_embeddings = {section: embedder.encode(prompt, convert_to_tensor=True) for section, prompt in soap_prompts.items()}
-# Load llava model and processor
-processor = AutoProcessor.from_pretrained("llava-hf/llava-v1.6-mistral-7b-hf")
-model = AutoModelForImageTextToText.from_pretrained("llava-hf/llava-v1.6-mistral-7b-hf")
-# Query function for LLAVA
-def llava_query(user_prompt, soap_note):
     combined_prompt = f"User Instructions:\n{user_prompt}\n\nContext:\n{soap_note}"
     try:
-        inputs = processor(combined_prompt, return_tensors="pt", padding=True)
-        outputs = model.generate(**inputs)
-        return processor.decode(outputs[0], skip_special_tokens=True)
     except Exception as e:
         return f"Error generating response: {e}"
 # Convert the response to JSON format
 def convert_to_json(template):
     try:
@@ -83,7 +70,6 @@ def convert_to_json(template):
     except Exception as e:
         return f"Error converting to JSON: {e}"
 # Transcription using Faster Whisper
 def transcribe_audio(mp4_path):
     try:
@@ -99,13 +85,11 @@ def transcribe_audio(mp4_path):
     except Exception as e:
         return f"Error during transcription: {e}"
 # Classify the sentence to the correct SOAP section
 def classify_sentence(sentence):
     """Return the SOAP section whose prompt embedding best matches ``sentence``.
     Args:
         sentence: Text of a single sentence to classify.
     Returns:
         The key of ``soap_prompts`` with the highest cosine similarity.
     """
     # Encode once: the sentence embedding does not depend on the section, so
     # re-encoding it per section only repeats the same model call.
     # convert_to_tensor=True mirrors how soap_embeddings was built.
     sentence_embedding = embedder.encode(sentence, convert_to_tensor=True)
     # .item() turns each 1x1 similarity tensor into a plain float for max().
     similarities = {
         section: util.pytorch_cos_sim(sentence_embedding, soap_embeddings[section]).item()
         for section in soap_prompts
     }
     return max(similarities, key=similarities.get)
 # Summarize the section if it's too long
 def summarize_section(section_text):
     if len(section_text.split()) < 50:
@@ -121,7 +105,6 @@ def summarize_section(section_text):
     )
     return tokenizer.decode(summary_ids[0], skip_special_tokens=True)
 # Analyze the SOAP content and divide into sections
 def soap_analysis(text):
     doc = nlp(text)
@@ -137,7 +120,6 @@ def soap_analysis(text):
     return format_soap_output(soap_note)
 # Format the SOAP note output
 def format_soap_output(soap_note):
     return (
@@ -147,7 +129,6 @@ def format_soap_output(soap_note):
         f"Plan:\n{soap_note['plan']}\n"
     )
 # Process file function for audio to SOAP
 def process_file(mp4_file, user_prompt):
     transcription = transcribe_audio(mp4_file.name)
@@ -156,26 +137,24 @@ def process_file(mp4_file, user_prompt):
     soap_note = soap_analysis(transcription)
     print("SOAP Notes: ", soap_note)
-    template_output = llava_query(user_prompt, soap_note)
     print("Template: ", template_output)
     json_output = convert_to_json(template_output)
     return soap_note, template_output, json_output
 # Process text function for text input to SOAP
 def process_text(text, user_prompt):
     """Turn raw text into a SOAP note, a generated template and its JSON form.
     Args:
         text: Input text handed to ``soap_analysis``.
         user_prompt: User instructions forwarded to the template query.
     Returns:
         A tuple ``(soap_note, template_output, json_output)``.
     """
     soap_note = soap_analysis(text)
     # Printed for debugging; the same value is also returned below.
     print(soap_note)
-    template_output = llava_query(user_prompt, soap_note)
     print(template_output)
     # convert_to_json returns an error string instead of raising on failure.
     json_output = convert_to_json(template_output)
     return soap_note, template_output, json_output
 # Launch the Gradio interface
 def launch_gradio():
     with gr.Blocks(theme=gr.themes.Default()) as demo:
@@ -189,7 +168,7 @@ def launch_gradio():
                 ],
                 outputs=[
                     gr.Textbox(label="SOAP Note"),
-                    gr.Textbox(label="Generated Template from LLAVA"),
                     gr.Textbox(label="JSON Output"),
                 ],
             )
@@ -202,13 +181,12 @@ def launch_gradio():
                 ],
                 outputs=[
                     gr.Textbox(label="SOAP Note"),
-                    gr.Textbox(label="Generated Template from LLAVA"),
                     gr.Textbox(label="JSON Output"),
                 ],
             )
     demo.launch(share=True, debug=True)
 # Run the Gradio app
 if __name__ == "__main__":
     launch_gradio()

 import torch
 import gradio as gr
+from transformers import pipeline, AutoTokenizer, AutoModelForSeq2SeqLM
 from pydub import AudioSegment
 from sentence_transformers import SentenceTransformer, util
 import spacy
 import json
+import ollama
 # Audio conversion from MP4 to MP3
 def convert_mp4_to_mp3(mp4_path, mp3_path):
     except Exception as e:
         raise RuntimeError(f"Error converting MP4 to MP3: {e}")
 # Check if CUDA is available for GPU acceleration
 if torch.cuda.is_available():
     device = "cuda"
     device = "cpu"
     compute_type = "int8"
 # Load Faster Whisper Model for transcription
 def load_faster_whisper():
     """Build and return the Faster Whisper model used for transcription.
     Returns:
         A ``WhisperModel`` created with the module-level ``device`` and
         ``compute_type`` settings.
     """
     # The module-level ``from faster_whisper import WhisperModel`` is no longer
     # present, so import it here; otherwise this call fails with NameError.
     from faster_whisper import WhisperModel
     return WhisperModel(
         "deepdml/faster-whisper-large-v3-turbo-ct2",
         device=device,
         compute_type=compute_type,
     )
 # Load NLP model and other helpers
 nlp = spacy.load("en_core_web_sm")
 embedder = SentenceTransformer("all-MiniLM-L6-v2")
 summarizer = pipeline("summarization", model=model, tokenizer=tokenizer)
 soap_prompts = {
     "subjective": "Personal reports, symptoms described by patients, or personal health concerns. Details reflecting individual symptoms or health descriptions.",
     "objective": "Observable facts, clinical findings, professional observations, specific medical specialties, and diagnoses.",
 }
 soap_embeddings = {section: embedder.encode(prompt, convert_to_tensor=True) for section, prompt in soap_prompts.items()}
+# Ollama Llama 2 Model Query function
+def ollama_query(user_prompt, soap_note):
     combined_prompt = f"User Instructions:\n{user_prompt}\n\nContext:\n{soap_note}"
     try:
+        response = ollama.run("llama2:7b-uncensored", prompt=combined_prompt)
+        return response
     except Exception as e:
         return f"Error generating response: {e}"
 # Convert the response to JSON format
 def convert_to_json(template):
     try:
     except Exception as e:
         return f"Error converting to JSON: {e}"
 # Transcription using Faster Whisper
 def transcribe_audio(mp4_path):
     try:
     except Exception as e:
         return f"Error during transcription: {e}"
 # Classify the sentence to the correct SOAP section
 def classify_sentence(sentence):
     """Return the SOAP section whose prompt embedding best matches ``sentence``.
     Args:
         sentence: Text of a single sentence to classify.
     Returns:
         The key of ``soap_prompts`` with the highest cosine similarity.
     """
     # Encode once: the sentence embedding does not depend on the section, so
     # re-encoding it per section only repeats the same model call.
     # convert_to_tensor=True mirrors how soap_embeddings was built.
     sentence_embedding = embedder.encode(sentence, convert_to_tensor=True)
     # .item() turns each 1x1 similarity tensor into a plain float for max().
     similarities = {
         section: util.pytorch_cos_sim(sentence_embedding, soap_embeddings[section]).item()
         for section in soap_prompts
     }
     return max(similarities, key=similarities.get)
 # Summarize the section if it's too long
 def summarize_section(section_text):
     if len(section_text.split()) < 50:
     )
     return tokenizer.decode(summary_ids[0], skip_special_tokens=True)
 # Analyze the SOAP content and divide into sections
 def soap_analysis(text):
     doc = nlp(text)
     return format_soap_output(soap_note)
 # Format the SOAP note output
 def format_soap_output(soap_note):
     return (
         f"Plan:\n{soap_note['plan']}\n"
     )
 # Process file function for audio to SOAP
 def process_file(mp4_file, user_prompt):
     transcription = transcribe_audio(mp4_file.name)
     soap_note = soap_analysis(transcription)
     print("SOAP Notes: ", soap_note)
+    template_output = ollama_query(user_prompt, soap_note)
     print("Template: ", template_output)
     json_output = convert_to_json(template_output)
     return soap_note, template_output, json_output
 # Process text function for text input to SOAP
 def process_text(text, user_prompt):
     """Turn raw text into a SOAP note, a generated template and its JSON form.
     Args:
         text: Input text handed to ``soap_analysis``.
         user_prompt: User instructions forwarded to ``ollama_query``.
     Returns:
         A tuple ``(soap_note, template_output, json_output)``.
     """
     soap_note = soap_analysis(text)
     # Printed for debugging; the same value is also returned below.
     print(soap_note)
+    template_output = ollama_query(user_prompt, soap_note)
     print(template_output)
     # convert_to_json returns an error string instead of raising on failure.
     json_output = convert_to_json(template_output)
     return soap_note, template_output, json_output
 # Launch the Gradio interface
 def launch_gradio():
     with gr.Blocks(theme=gr.themes.Default()) as demo:
                 ],
                 outputs=[
                     gr.Textbox(label="SOAP Note"),
+                    gr.Textbox(label="Generated Template from Llama 2"),
                     gr.Textbox(label="JSON Output"),
                 ],
             )
                 ],
                 outputs=[
                     gr.Textbox(label="SOAP Note"),
+                    gr.Textbox(label="Generated Template from Llama 2"),
                     gr.Textbox(label="JSON Output"),
                 ],
             )
     demo.launch(share=True, debug=True)
 # Run the Gradio app
 if __name__ == "__main__":
     launch_gradio()