Spaces:

Rohith1112
/

ICLINIQ

Sleeping

App Files Files Community

Rohith1112 commited on Mar 4

Commit

e7bcdf0

verified ·

1 Parent(s): aff94f6

U

Browse files

Files changed (1) hide show

app.py +30 -77

app.py CHANGED Viewed

@@ -4,11 +4,9 @@ import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM
 import gradio as gr
 import matplotlib.pyplot as plt
-from datasets import load_dataset
-from evaluate import load  # For evaluation metrics
 # Model setup
-device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')  # Use GPU if available
 dtype = torch.float32
 model_name_or_path = 'GoodBaiBai88/M3D-LaMed-Phi-3-4B'
 proj_out_num = 256
@@ -16,8 +14,8 @@ proj_out_num = 256
 # Load model and tokenizer
 model = AutoModelForCausalLM.from_pretrained(
     model_name_or_path,
-    torch_dtype=dtype,
-    device_map=device.type,
     trust_remote_code=True
 )
@@ -29,50 +27,43 @@ tokenizer = AutoTokenizer.from_pretrained(
     trust_remote_code=True
 )
-# Load the M3D-Cap dataset
-dataset = load_dataset("GoodBaiBai88/M3D-Cap")
 # Chat history storage
 chat_history = []
 current_image = None
 def extract_and_display_images(image_path):
-    try:
-        npy_data = np.load(image_path)
-        if npy_data.ndim == 4 and npy_data.shape[1] == 32:
-            npy_data = npy_data[0]
-        elif npy_data.ndim != 3 or npy_data.shape[0] != 32:
-            return "Invalid .npy file format. Expected shape (1, 32, 256, 256) or (32, 256, 256)."
-        fig, axes = plt.subplots(4, 8, figsize=(12, 6))
-        for i, ax in enumerate(axes.flat):
-            ax.imshow(npy_data[i], cmap='gray')
-            ax.axis('off')
-        image_output = "extracted_images.png"
-        plt.savefig(image_output, bbox_inches='tight')
-        plt.close()
-        return image_output
-    except Exception as e:
-        return f"Error processing image: {str(e)}"
 def process_image(question):
     global current_image
     if current_image is None:
         return "Please upload an image first."
-    try:
-        image_np = np.load(current_image)
-        image_tokens = "<im_patch>" * proj_out_num
-        input_txt = image_tokens + question
-        input_id = tokenizer(input_txt, return_tensors="pt")['input_ids'].to(device=device)
-        image_pt = torch.from_numpy(image_np).unsqueeze(0).to(dtype=dtype, device=device)
-        generation = model.generate(image_pt, input_id, max_new_tokens=256, do_sample=True, top_p=0.9, temperature=1.0)
-        generated_texts = tokenizer.batch_decode(generation, skip_special_tokens=True)
-        return generated_texts[0]
-    except Exception as e:
-        return f"Error generating response: {str(e)}"
 def chat_interface(question):
     global chat_history
@@ -80,48 +71,13 @@ def chat_interface(question):
     chat_history.append((question, response))
     return chat_history
 def upload_image(image):
     global current_image
     current_image = image.name
     extracted_image_path = extract_and_display_images(current_image)
     return "Image uploaded and processed successfully!", extracted_image_path
-def test_model_with_dataset():
-    # Load evaluation metrics
-    bleu = load("bleu")
-    rouge = load("rouge")
-    # Initialize lists to store predictions and references
-    predictions = []
-    references = []
-    # Iterate over the dataset
-    for example in dataset['train']:  # Use 'train', 'validation', or 'test' split
-        image_path = example['image']  # Assuming 'image' contains the path to the .npy file
-        question = example['caption']  # Assuming 'caption' contains the question or caption
-        # Upload the image
-        upload_image({"name": image_path})
-        # Get the model's response
-        response = process_image(question)
-        # Store predictions and references
-        predictions.append(response)
-        references.append(question)
-        # Print results for debugging
-        print(f"Question: {question}")
-        print(f"Model Response: {response}")
-        print("---")
-    # Compute evaluation metrics
-    bleu_score = bleu.compute(predictions=predictions, references=references)
-    rouge_score = rouge.compute(predictions=predictions, references=references)
-    print(f"BLEU Score: {bleu_score}")
-    print(f"ROUGE Score: {rouge_score}")
 # Gradio UI
 with gr.Blocks(theme=gr.themes.Soft()) as chat_ui:
     gr.Markdown("ICliniq AI-Powered Medical Image Analysis Workspace")
@@ -139,7 +95,4 @@ with gr.Blocks(theme=gr.themes.Soft()) as chat_ui:
     submit_button.click(chat_interface, question_input, chat_list)
     question_input.submit(chat_interface, question_input, chat_list)
-# Uncomment to test the model with the dataset
-# test_model_with_dataset()
 chat_ui.launch()

 from transformers import AutoTokenizer, AutoModelForCausalLM
 import gradio as gr
 import matplotlib.pyplot as plt
 # Model setup
+device = torch.device('cpu')  # Use 'cuda' if GPU is available
 dtype = torch.float32
 model_name_or_path = 'GoodBaiBai88/M3D-LaMed-Phi-3-4B'
 proj_out_num = 256
 # Load model and tokenizer
 model = AutoModelForCausalLM.from_pretrained(
     model_name_or_path,
+    torch_dtype=torch.float32,
+    device_map='cpu',
     trust_remote_code=True
 )
     trust_remote_code=True
 )
 # Chat history storage
 chat_history = []
 current_image = None
 def extract_and_display_images(image_path):
+    npy_data = np.load(image_path)
+    if npy_data.ndim == 4 and npy_data.shape[1] == 32:
+        npy_data = npy_data[0]
+    elif npy_data.ndim != 3 or npy_data.shape[0] != 32:
+        return "Invalid .npy file format. Expected shape (1, 32, 256, 256) or (32, 256, 256)."
+    fig, axes = plt.subplots(4, 8, figsize=(12, 6))
+    for i, ax in enumerate(axes.flat):
+        ax.imshow(npy_data[i], cmap='gray')
+        ax.axis('off')
+    image_output = "extracted_images.png"
+    plt.savefig(image_output, bbox_inches='tight')
+    plt.close()
+    return image_output
 def process_image(question):
     global current_image
     if current_image is None:
         return "Please upload an image first."
+    image_np = np.load(current_image)
+    image_tokens = "<im_patch>" * proj_out_num
+    input_txt = image_tokens + question
+    input_id = tokenizer(input_txt, return_tensors="pt")['input_ids'].to(device=device)
+    image_pt = torch.from_numpy(image_np).unsqueeze(0).to(dtype=dtype, device=device)
+    generation = model.generate(image_pt, input_id, max_new_tokens=256, do_sample=True, top_p=0.9, temperature=1.0)
+    generated_texts = tokenizer.batch_decode(generation, skip_special_tokens=True)
+    return generated_texts[0]
 def chat_interface(question):
     global chat_history
     chat_history.append((question, response))
     return chat_history
 def upload_image(image):
     global current_image
     current_image = image.name
     extracted_image_path = extract_and_display_images(current_image)
     return "Image uploaded and processed successfully!", extracted_image_path
 # Gradio UI
 with gr.Blocks(theme=gr.themes.Soft()) as chat_ui:
     gr.Markdown("ICliniq AI-Powered Medical Image Analysis Workspace")
     submit_button.click(chat_interface, question_input, chat_list)
     question_input.submit(chat_interface, question_input, chat_list)
 chat_ui.launch()