Spaces: Running on Zero
Update app.py
app.py CHANGED
@@ -56,6 +56,26 @@ def glb_to_data_url(glb_path: str) -> str:
     b64_data = base64.b64encode(data).decode("utf-8")
     return f"data:model/gltf-binary;base64,{b64_data}"
 
+def progress_bar_html(label: str) -> str:
+    """
+    Returns an HTML snippet for a thin progress bar with a label.
+    The progress bar is styled as a dark red animated bar.
+    """
+    return f'''
+<div style="display: flex; align-items: center;">
+    <span style="margin-right: 10px; font-size: 14px;">{label}</span>
+    <div style="width: 110px; height: 5px; background-color: #f0f0f0; border-radius: 2px; overflow: hidden;">
+        <div style="width: 100%; height: 100%; background-color: darkred; animation: loading 1.5s linear infinite;"></div>
+    </div>
+</div>
+<style>
+@keyframes loading {{
+    0% {{ transform: translateX(-100%); }}
+    100% {{ transform: translateX(100%); }}
+}}
+</style>
+    '''
+
 # Model class for Text-to-3D Generation (ShapE)
 
 class Model:
@@ -204,7 +224,7 @@ SYSTEM_PROMPT = """
     "2. **Code**: Write Python code to implement your solution.\n"
     "3. **Observation**: Analyze the output of the code and summarize the results.\n"
     "4. **Final Answer**: Provide a concise conclusion or final result.\n\n"
-    f"Task: {task}"
+    f"Task: {{task}}"
 
 """
 
@@ -357,7 +377,7 @@ def save_image(img: Image.Image) -> str:
     return unique_name
 
 @spaces.GPU(duration=60, enable_queue=True)
-#SG161222/RealVisXL_V5.0_Lightning
+# SG161222/RealVisXL_V5.0_Lightning
 def generate_image_fn(
     prompt: str,
     negative_prompt: str = "",
@@ -472,7 +492,7 @@ def generate(
     # --- 3D Generation branch ---
     if text.strip().lower().startswith("@3d"):
         prompt = text[len("@3d"):].strip()
-        yield "
+        yield progress_bar_html("Processing 3D Mesh Generation")
         glb_path, used_seed = generate_3d_fn(
             prompt=prompt,
             seed=1,
@@ -481,7 +501,7 @@ def generate(
             randomize_seed=True,
         )
         # Copy the GLB file to a static folder.
-        yield "
+        yield progress_bar_html("Finalizing 3D Mesh Generation")
         static_folder = os.path.join(os.getcwd(), "static")
         if not os.path.exists(static_folder):
             os.makedirs(static_folder)
@@ -495,7 +515,7 @@ def generate(
     # --- Image Generation branch ---
     if text.strip().lower().startswith("@image"):
         prompt = text[len("@image"):].strip()
-        yield "
+        yield progress_bar_html("Generating Image")
        image_paths, used_seed = generate_image_fn(
            prompt=prompt,
            negative_prompt="",
@@ -518,14 +538,14 @@ def generate(
        # If the command starts with "visit", then treat the rest as a URL
        if web_command.lower().startswith("visit"):
            url = web_command[len("visit"):].strip()
-            yield "
+            yield progress_bar_html("Visiting Webpage")
            visitor = VisitWebpageTool()
            content = visitor.forward(url)
            yield content
        else:
            # Otherwise, treat the rest as a search query.
            query = web_command
-            yield "
+            yield progress_bar_html("Performing Web Search")
            searcher = DuckDuckGoSearchTool()
            results = searcher.forward(query)
            yield results
@@ -534,7 +554,7 @@ def generate(
    # --- rAgent Reasoning branch ---
    if text.strip().lower().startswith("@ragent"):
        prompt = text[len("@ragent"):].strip()
-        yield "
+        yield progress_bar_html("Processing Reasoning Chain")
        # Pass the current chat history (cleaned) to help inform the chain.
        for partial in ragent_reasoning(prompt, clean_chat_history(chat_history)):
            yield partial
@@ -542,7 +562,7 @@ def generate(
 
    # --- YOLO Object Detection branch ---
    if text.strip().lower().startswith("@yolo"):
-        yield "
+        yield progress_bar_html("Performing Object Detection")
        if not files or len(files) == 0:
            yield "Error: Please attach an image for YOLO object detection."
            return
@@ -617,7 +637,7 @@ def generate(
 
        # Stream the response
        buffer = ""
-        yield "
+        yield progress_bar_html("Processing Phi-4 Multimodal")
        for new_text in streamer:
            buffer += new_text
            time.sleep(0.01)  # Small delay to simulate real-time streaming
@@ -661,7 +681,7 @@ def generate(
        thread.start()
 
        buffer = ""
-        yield "
+        yield progress_bar_html("Processing with Qwen2VL OCR")
        for new_text in streamer:
            buffer += new_text
            buffer = buffer.replace("<|im_end|>", "")
@@ -689,6 +709,7 @@ def generate(
        t.start()
 
        outputs = []
+        yield progress_bar_html("Processing Chat Response")
        for new_text in streamer:
            outputs.append(new_text)
            yield "".join(outputs)
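For context on the pattern this commit introduces: each command branch now yields the animated progress-bar HTML as a placeholder chat message before the heavy work starts, and later yields overwrite it with the real output. Below is a minimal, self-contained sketch of that idea, assuming a Gradio ChatInterface driving a generator function; the respond function and its fake streaming loop are illustrative stand-ins, not code from app.py.

import time
import gradio as gr

def progress_bar_html(label: str) -> str:
    # Same approach as the helper added in this commit: a labeled, animated thin bar.
    return f'''
<div style="display: flex; align-items: center;">
    <span style="margin-right: 10px; font-size: 14px;">{label}</span>
    <div style="width: 110px; height: 5px; background-color: #f0f0f0; border-radius: 2px; overflow: hidden;">
        <div style="width: 100%; height: 100%; background-color: darkred; animation: loading 1.5s linear infinite;"></div>
    </div>
</div>
<style>
@keyframes loading {{
    0% {{ transform: translateX(-100%); }}
    100% {{ transform: translateX(100%); }}
}}
</style>
'''

def respond(message, history):
    # First yield shows the progress bar as the bot message;
    # each later yield replaces it with the partial result so far.
    yield progress_bar_html("Processing request")
    buffer = ""
    for chunk in ["streamed ", "partial ", "output"]:  # stand-in for a model token streamer
        time.sleep(0.5)
        buffer += chunk
        yield buffer

demo = gr.ChatInterface(respond)
demo.launch()

Because a Gradio generator callback replaces the previous yield rather than appending to it, the progress bar disappears automatically as soon as the first real chunk arrives.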