Spaces:

Rohith1112
/

ICLINIQ

Running

App Files Community

Rohith1112 committed 16 days ago

Commit

aff94f6

verified ·

1 Parent(s): 28f8c56

u

Browse files

Files changed (1) hide show

app.py +79 -32

app.py CHANGED Viewed

@@ -4,9 +4,11 @@ import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM
 import gradio as gr
 import matplotlib.pyplot as plt
 # Model setup
-device = torch.device('cpu')  # Use 'cuda' if GPU is available
 dtype = torch.float32
 model_name_or_path = 'GoodBaiBai88/M3D-LaMed-Phi-3-4B'
 proj_out_num = 256
@@ -14,8 +16,8 @@ proj_out_num = 256
 # Load model and tokenizer
 model = AutoModelForCausalLM.from_pretrained(
     model_name_or_path,
-    torch_dtype=torch.float32,
-    device_map='cpu',
     trust_remote_code=True
 )
@@ -27,43 +29,50 @@ tokenizer = AutoTokenizer.from_pretrained(
     trust_remote_code=True
 )
 # Chat history storage
 chat_history = []
 current_image = None
 def extract_and_display_images(image_path):
-    npy_data = np.load(image_path)
-    if npy_data.ndim == 4 and npy_data.shape[1] == 32:
-        npy_data = npy_data[0]
-    elif npy_data.ndim != 3 or npy_data.shape[0] != 32:
-        return "Invalid .npy file format. Expected shape (1, 32, 256, 256) or (32, 256, 256)."
-    fig, axes = plt.subplots(4, 8, figsize=(12, 6))
-    for i, ax in enumerate(axes.flat):
-        ax.imshow(npy_data[i], cmap='gray')
-        ax.axis('off')
-    image_output = "extracted_images.png"
-    plt.savefig(image_output, bbox_inches='tight')
-    plt.close()
-    return image_output
 def process_image(question):
     global current_image
     if current_image is None:
         return "Please upload an image first."
-    image_np = np.load(current_image)
-    image_tokens = "<im_patch>" * proj_out_num
-    input_txt = image_tokens + question
-    input_id = tokenizer(input_txt, return_tensors="pt")['input_ids'].to(device=device)
-    image_pt = torch.from_numpy(image_np).unsqueeze(0).to(dtype=dtype, device=device)
-    generation = model.generate(image_pt, input_id, max_new_tokens=256, do_sample=True, top_p=0.9, temperature=1.0)
-    generated_texts = tokenizer.batch_decode(generation, skip_special_tokens=True)
-    return generated_texts[0]
 def chat_interface(question):
     global chat_history
@@ -71,16 +80,51 @@ def chat_interface(question):
     chat_history.append((question, response))
     return chat_history
 def upload_image(image):
     global current_image
     current_image = image.name
     extracted_image_path = extract_and_display_images(current_image)
     return "Image uploaded and processed successfully!", extracted_image_path
 # Gradio UI
 with gr.Blocks(theme=gr.themes.Soft()) as chat_ui:
-    gr.Markdown("# 🏥 AI-Powered Medical Image Analysis Chatbot")
     with gr.Row():
         with gr.Column(scale=1, min_width=200):
             chat_list = gr.Chatbot(value=[], label="Chat History", elem_id="chat-history")
@@ -95,4 +139,7 @@ with gr.Blocks(theme=gr.themes.Soft()) as chat_ui:
     submit_button.click(chat_interface, question_input, chat_list)
     question_input.submit(chat_interface, question_input, chat_list)
-chat_ui.launch()

 from transformers import AutoTokenizer, AutoModelForCausalLM
 import gradio as gr
 import matplotlib.pyplot as plt
+from datasets import load_dataset
+from evaluate import load  # For evaluation metrics
 # Model setup
+device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')  # Use GPU if available
 dtype = torch.float32
 model_name_or_path = 'GoodBaiBai88/M3D-LaMed-Phi-3-4B'
 proj_out_num = 256
 # Load model and tokenizer
 model = AutoModelForCausalLM.from_pretrained(
     model_name_or_path,
+    torch_dtype=dtype,
+    device_map=device.type,
     trust_remote_code=True
 )
     trust_remote_code=True
 )
+# Load the M3D-Cap dataset
+dataset = load_dataset("GoodBaiBai88/M3D-Cap")
 # Chat history storage
 chat_history = []
 current_image = None
 def extract_and_display_images(image_path):
+    try:
+        npy_data = np.load(image_path)
+        if npy_data.ndim == 4 and npy_data.shape[1] == 32:
+            npy_data = npy_data[0]
+        elif npy_data.ndim != 3 or npy_data.shape[0] != 32:
+            return "Invalid .npy file format. Expected shape (1, 32, 256, 256) or (32, 256, 256)."
+        fig, axes = plt.subplots(4, 8, figsize=(12, 6))
+        for i, ax in enumerate(axes.flat):
+            ax.imshow(npy_data[i], cmap='gray')
+            ax.axis('off')
+        image_output = "extracted_images.png"
+        plt.savefig(image_output, bbox_inches='tight')
+        plt.close()
+        return image_output
+    except Exception as e:
+        return f"Error processing image: {str(e)}"
 def process_image(question):
     global current_image
     if current_image is None:
         return "Please upload an image first."
+    try:
+        image_np = np.load(current_image)
+        image_tokens = "<im_patch>" * proj_out_num
+        input_txt = image_tokens + question
+        input_id = tokenizer(input_txt, return_tensors="pt")['input_ids'].to(device=device)
+        image_pt = torch.from_numpy(image_np).unsqueeze(0).to(dtype=dtype, device=device)
+        generation = model.generate(image_pt, input_id, max_new_tokens=256, do_sample=True, top_p=0.9, temperature=1.0)
+        generated_texts = tokenizer.batch_decode(generation, skip_special_tokens=True)
+        return generated_texts[0]
+    except Exception as e:
+        return f"Error generating response: {str(e)}"
 def chat_interface(question):
     global chat_history
     chat_history.append((question, response))
     return chat_history
 def upload_image(image):
     global current_image
     current_image = image.name
     extracted_image_path = extract_and_display_images(current_image)
     return "Image uploaded and processed successfully!", extracted_image_path
+def test_model_with_dataset():
+    # Load evaluation metrics
+    bleu = load("bleu")
+    rouge = load("rouge")
+    # Initialize lists to store predictions and references
+    predictions = []
+    references = []
+    # Iterate over the dataset
+    for example in dataset['train']:  # Use 'train', 'validation', or 'test' split
+        image_path = example['image']  # Assuming 'image' contains the path to the .npy file
+        question = example['caption']  # Assuming 'caption' contains the question or caption
+        # Upload the image
+        upload_image({"name": image_path})
+        # Get the model's response
+        response = process_image(question)
+        # Store predictions and references
+        predictions.append(response)
+        references.append(question)
+        # Print results for debugging
+        print(f"Question: {question}")
+        print(f"Model Response: {response}")
+        print("---")
+    # Compute evaluation metrics
+    bleu_score = bleu.compute(predictions=predictions, references=references)
+    rouge_score = rouge.compute(predictions=predictions, references=references)
+    print(f"BLEU Score: {bleu_score}")
+    print(f"ROUGE Score: {rouge_score}")
 # Gradio UI
 with gr.Blocks(theme=gr.themes.Soft()) as chat_ui:
+    gr.Markdown("ICliniq AI-Powered Medical Image Analysis Workspace")
     with gr.Row():
         with gr.Column(scale=1, min_width=200):
             chat_list = gr.Chatbot(value=[], label="Chat History", elem_id="chat-history")
     submit_button.click(chat_interface, question_input, chat_list)
     question_input.submit(chat_interface, question_input, chat_list)
+# Uncomment to test the model with the dataset
+# test_model_with_dataset()
+chat_ui.launch()