Spaces:

Prashant26am
/

llava-chat

Sleeping

Prashant26am committed on May 24

Commit

70a8a19

1 Parent(s): e5d40e3

fix: Update model initialization for CPU support

Files changed (2) hide show

src/configs/settings.py CHANGED Viewed

@@ -3,7 +3,11 @@ Configuration settings for the LLaVA implementation.
 """
 import os
 from pathlib import Path
 # Project paths
 PROJECT_ROOT = Path(__file__).parent.parent.parent
@@ -14,7 +18,13 @@ EXAMPLES_DIR = PROJECT_ROOT / "examples"
 # Model settings
 MODEL_NAME = "liuhaotian/llava-v1.5-7b"
 MODEL_REVISION = "main"
-DEVICE = "cuda" if os.environ.get("CUDA_VISIBLE_DEVICES") else "cpu"
 # Generation settings
 DEFAULT_MAX_NEW_TOKENS = 512

 """
 import os
+import torch
 from pathlib import Path
+from ..utils.logging import get_logger
+logger = get_logger(__name__)
 # Project paths
 PROJECT_ROOT = Path(__file__).parent.parent.parent
 # Model settings
 MODEL_NAME = "liuhaotian/llava-v1.5-7b"
 MODEL_REVISION = "main"
+# Device detection
+DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
+if DEVICE == "cuda":
+    logger.info(f"Using CUDA device: {torch.cuda.get_device_name(0)}")
+else:
+    logger.info("CUDA not available, using CPU")
 # Generation settings
 DEFAULT_MAX_NEW_TOKENS = 512

src/models/llava_model.py CHANGED Viewed

@@ -16,20 +16,39 @@ class LLaVAModel:
     def __init__(self):
         """Initialize the LLaVA model and processor."""
-        logger.info(f"Initializing LLaVA model from {MODEL_NAME}")
-        self.processor = AutoProcessor.from_pretrained(
-            MODEL_NAME,
-            revision=MODEL_REVISION,
-            trust_remote_code=True
-        )
-        self.model = AutoModelForCausalLM.from_pretrained(
-            MODEL_NAME,
-            revision=MODEL_REVISION,
-            torch_dtype=torch.float16,
-            device_map="auto",
-            trust_remote_code=True
-        )
-        logger.info("Model initialization complete")
     def generate_response(
         self,

     def __init__(self):
         """Initialize the LLaVA model and processor."""
+        try:
+            logger.info(f"Initializing LLaVA model from {MODEL_NAME}")
+            logger.info(f"Using device: {DEVICE}")
+            # Initialize processor
+            self.processor = AutoProcessor.from_pretrained(
+                MODEL_NAME,
+                revision=MODEL_REVISION,
+                trust_remote_code=True
+            )
+            # Set model dtype based on device
+            model_dtype = torch.float32 if DEVICE == "cpu" else torch.float16
+            # Initialize model with appropriate settings
+            self.model = AutoModelForCausalLM.from_pretrained(
+                MODEL_NAME,
+                revision=MODEL_REVISION,
+                torch_dtype=model_dtype,
+                device_map="auto" if DEVICE == "cuda" else None,
+                trust_remote_code=True,
+                low_cpu_mem_usage=True
+            )
+            # Move model to device if not using device_map
+            if DEVICE == "cpu":
+                self.model = self.model.to(DEVICE)
+            logger.info("Model initialization complete")
+        except Exception as e:
+            logger.error(f"Error initializing model: {str(e)}")
+            raise
     def generate_response(
         self,