Spaces:

yuting111222
/

health-assistant

Sleeping

App Files Files Community

yuting111222 committed on Aug 4

Commit

a608ddf

1 Parent(s): f9b12dd

Update health assistant minimal with new services and improvements

Browse files

Files changed (7) hide show

__pycache__/__init__.cpython-313.pyc +0 -0
app/routers/ai_router.py +100 -16
app/services/integrated_food_analysis_service.py +234 -0
app/services/nutrition_api_service.py +1 -1
app/services/reference_detection_service.py +198 -0
app/services/weight_calculation_service.py +309 -0
app/services/weight_estimation_service.py +172 -108

__pycache__/__init__.cpython-313.pyc CHANGED Viewed

Binary files a/__pycache__/__init__.cpython-313.pyc and b/__pycache__/__init__.cpython-313.pyc differ

app/routers/ai_router.py CHANGED Viewed

@@ -3,6 +3,14 @@
 from fastapi import APIRouter, File, UploadFile, HTTPException
 from pydantic import BaseModel
 from typing import Dict, Any, List, Optional
 router = APIRouter(
     prefix="/ai",
@@ -10,6 +18,16 @@ router = APIRouter(
 )
 # 新增 Pydantic 模型定義
 class WeightEstimationResponse(BaseModel):
     food_type: str
     estimated_weight: float
@@ -33,29 +51,86 @@ async def analyze_food_image_endpoint(file: UploadFile = File(...)):
     if not file.content_type or not file.content_type.startswith("image/"):
         raise HTTPException(status_code=400, detail="上傳的檔案不是圖片格式。")
-    # 暫時返回測試回應
-    return {"food_name": "測試食物", "nutrition_info": {"calories": 100}}
 @router.post("/analyze-food-image-with-weight/", response_model=WeightEstimationResponse)
 async def analyze_food_image_with_weight_endpoint(file: UploadFile = File(...)):
     """
     整合食物辨識、重量估算與營養分析的端點。
-    包含信心度與誤差範圍，支援參考物偵測。
     """
     # 檢查上傳的檔案是否為圖片格式
     if not file.content_type or not file.content_type.startswith("image/"):
         raise HTTPException(status_code=400, detail="上傳的檔案不是圖片格式。")
-    # 暫時返回測試回應
-    return WeightEstimationResponse(
-        food_type="測試食物",
-        estimated_weight=150.0,
-        weight_confidence=0.85,
-        weight_error_range=[130.0, 170.0],
-        nutrition={"calories": 100, "protein": 5, "fat": 2, "carbs": 15},
-        reference_object="硬幣",
-        note="測試重量估算結果"
-    )
 @router.get("/health")
 async def health_check():
@@ -65,8 +140,17 @@ async def health_check():
     return {
         "status": "healthy",
         "services": {
-            "food_classification": "available",
-            "weight_estimation": "available",
-            "nutrition_api": "available"
         }
     }

 from fastapi import APIRouter, File, UploadFile, HTTPException
 from pydantic import BaseModel
 from typing import Dict, Any, List, Optional
+import logging
+# 導入新的整合服務
+from ..services.integrated_food_analysis_service import analyze_food_image_integrated
+# 設置日誌
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
 router = APIRouter(
     prefix="/ai",
 )
 # 新增 Pydantic 模型定義
+class IntegratedAnalysisResponse(BaseModel):
+    # Schema mirroring the success payload assembled by the integrated analysis service.
+    # NOTE(review): no endpoint visible in this diff passes it as response_model - confirm it is used.
+    # NOTE(review): the service's error payload (success=False) carries none of the fields below except success.
+    success: bool  # True on the success payload
+    analysis_time: float  # elapsed seconds, rounded to 2 decimals by the service
+    food_analysis: Dict[str, Any]  # food_name, recognition_method, confidence
+    reference_analysis: Dict[str, Any]  # detected_objects, best_reference, pixel_ratio, detection_method
+    weight_analysis: Dict[str, Any]  # estimated_weight, weight_confidence, weight_error_range, calculation_method, reference_object
+    nutrition_analysis: Dict[str, Any]  # base_nutrition, adjusted_nutrition, data_source, weight_ratio
+    summary: Dict[str, Any]  # total_calories, total_protein, total_carbs, total_fat, health_score
+    architecture: Dict[str, str]  # layer_1 .. layer_5 descriptions of the pipeline stages
 class WeightEstimationResponse(BaseModel):
     food_type: str
     estimated_weight: float
     if not file.content_type or not file.content_type.startswith("image/"):
         raise HTTPException(status_code=400, detail="上傳的檔案不是圖片格式。")
+    try:
+        # 讀取圖片數據
+        image_bytes = await file.read()
+        # 使用新的整合服務進行分析
+        result = analyze_food_image_integrated(image_bytes, debug=False)
+        if not result.get("success", False):
+            raise HTTPException(status_code=500, detail=result.get("error_message", "分析失敗"))
+        # 返回簡化的結果
+        return {
+            "food_name": result["food_analysis"]["food_name"],
+            "nutrition_info": result["nutrition_analysis"]["adjusted_nutrition"]
+        }
+    except Exception as e:
+        logger.error(f"食物分析失敗: {str(e)}")
+        raise HTTPException(status_code=500, detail=f"分析失敗: {str(e)}")
 @router.post("/analyze-food-image-with-weight/", response_model=WeightEstimationResponse)
 async def analyze_food_image_with_weight_endpoint(file: UploadFile = File(...)):
+    """
+    Recognise the food in an uploaded image, estimate its weight and scale its nutrition.
+    Pipeline: FOOD101 -> YOLO (reference object) -> SAM+DPT -> USDA API.
+    Args:
+        file: The uploaded image.
+    Returns:
+        WeightEstimationResponse: The integrated result mapped onto the legacy response shape.
+    Raises:
+        HTTPException: 400 when the upload is not an image; 500 when the analysis
+            reports failure or raises unexpectedly.
+    """
+    # Reject uploads whose declared content type is not an image.
+    if not file.content_type or not file.content_type.startswith("image/"):
+        raise HTTPException(status_code=400, detail="上傳的檔案不是圖片格式。")
+    try:
+        image_bytes = await file.read()
+        result = analyze_food_image_integrated(image_bytes, debug=False)
+        if not result.get("success", False):
+            raise HTTPException(status_code=500, detail=result.get("error_message", "分析失敗"))
+        # Convert to the older response format to stay backward compatible.
+        weight_analysis = result["weight_analysis"]
+        nutrition_analysis = result["nutrition_analysis"]
+        return WeightEstimationResponse(
+            food_type=result["food_analysis"]["food_name"],
+            estimated_weight=weight_analysis["estimated_weight"],
+            weight_confidence=weight_analysis["weight_confidence"],
+            weight_error_range=weight_analysis["weight_error_range"],
+            nutrition=nutrition_analysis["adjusted_nutrition"],
+            reference_object=weight_analysis["reference_object"],
+            note=f"使用新架構分析，耗時 {result['analysis_time']} 秒"
+        )
+    except HTTPException:
+        # HTTPException is itself an Exception: without this clause the deliberate
+        # 500 raised above would be caught below and re-wrapped with a mangled detail.
+        raise
+    except Exception as e:
+        logger.error(f"重量估算分析失敗: {str(e)}")
+        raise HTTPException(status_code=500, detail=f"分析失敗: {str(e)}") from e
+@router.post("/analyze-food-image-integrated/")
+async def analyze_food_image_integrated_endpoint(file: UploadFile = File(...)):
+    """
+    Integrated analysis endpoint that returns the service's complete result dict.
+    Pipeline: FOOD101 -> YOLO (reference object) -> SAM+DPT -> USDA API.
+    Raises:
+        HTTPException: 400 when the upload is not an image; 500 when the analysis raises.
+    """
+    # Only uploads that declare an image content type are accepted.
+    content_type = file.content_type
+    declared_as_image = bool(content_type) and content_type.startswith("image/")
+    if not declared_as_image:
+        raise HTTPException(status_code=400, detail="上傳的檔案不是圖片格式。")
+    try:
+        # Read the upload and hand the raw bytes straight to the integrated service.
+        return analyze_food_image_integrated(await file.read(), debug=False)
+    except Exception as exc:
+        logger.error(f"整合分析失敗: {str(exc)}")
+        raise HTTPException(status_code=500, detail=f"分析失敗: {str(exc)}")
 @router.get("/health")
 async def health_check():
     return {
         "status": "healthy",
         "services": {
+            "food_classification": "available (FOOD101)",
+            "reference_detection": "available (YOLO)",
+            "weight_estimation": "available (SAM+DPT)",
+            "nutrition_api": "available (USDA)",
+            "integrated_analysis": "available"
+        },
+        "architecture": {
+            "layer_1": "FOOD101 (食物識別)",
+            "layer_2": "YOLO (參考物偵測)",
+            "layer_3": "SAM+DPT (重量計算)",
+            "layer_4": "USDA API (營養查詢)",
+            "layer_5": "重量調整 (營養計算)"
         }
     }

app/services/integrated_food_analysis_service.py ADDED Viewed

	@@ -0,0 +1,234 @@

+# 檔案路徑: app/services/integrated_food_analysis_service.py
+import logging
+import numpy as np
+from PIL import Image
+import io
+from typing import Dict, Any, List, Optional, Tuple
+from datetime import datetime
+# 導入各個服務
+from .ai_service import classify_food_image
+from .reference_detection_service import detect_reference_objects_from_image
+from .weight_calculation_service import calculate_food_weight
+from .nutrition_api_service import fetch_nutrition_data
+# 設置日誌
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+class IntegratedFoodAnalysisService:
+    """
+    Orchestrates the food-analysis pipeline: food recognition, reference-object
+    detection, weight estimation and nutrition lookup, merged into one report.
+    """
+    # Entries of a nutrition record that are labels rather than per-100 g quantities.
+    _NON_NUTRIENT_KEYS = ("food_name", "chinese_name")
+    # Labels preferred as the scale reference; mirrors the priority used by the
+    # reference-detection service when it derives the pixel ratio.
+    _PRIORITY_REFERENCE_LABELS = ("plate", "bowl")
+    # Scale in cm/pixel assumed when no reference object provides one.
+    _DEFAULT_PIXEL_RATIO = 0.01
+    def __init__(self):
+        """Log that the service is being initialised; no state is kept."""
+        logger.info("初始化整合食物分析服務...")
+    def analyze_food_image(self, image_bytes: bytes, debug: bool = False) -> Dict[str, Any]:
+        """
+        Run the complete analysis on one image.
+        Stages:
+        1. The FOOD101 classifier names the food.
+        2. YOLO locates a reference object and yields a cm/pixel scale.
+        3. SAM+DPT estimate the weight.
+        4. Per-100 g nutrition values are fetched from the USDA API.
+        5. Those values are scaled by the estimated weight.
+        Args:
+            image_bytes: Raw bytes of the image.
+            debug: Accepted for interface compatibility; not used by this method.
+        Returns:
+            Dict: The full report with ``success`` True, or the dict built by
+            ``_create_error_response`` (``success`` False) when a stage fails.
+        """
+        try:
+            logger.info("=== 開始整合食物分析 ===")
+            start_time = datetime.now()
+            # Decode up front so an unreadable upload fails before any model runs.
+            image = Image.open(io.BytesIO(image_bytes)).convert("RGB")
+            logger.info(f"圖片載入完成，尺寸: {image.size}")
+            # === Stage 1: food recognition (FOOD101) ===
+            logger.info("--- 第一層：FOOD101 食物識別 ---")
+            food_name = classify_food_image(image_bytes)
+            logger.info(f"FOOD101 識別結果: {food_name}")
+            if food_name.startswith("Error") or food_name == "Unknown":
+                return self._create_error_response("食物識別失敗", food_name)
+            # === Stage 2: reference-object detection (YOLO) ===
+            logger.info("--- 第二層：YOLO 參考物偵測 ---")
+            reference_objects, pixel_ratio = detect_reference_objects_from_image(image_bytes)
+            if not reference_objects or pixel_ratio is None:
+                logger.warning("未偵測到參考物，使用預設像素比例")
+                pixel_ratio = self._DEFAULT_PIXEL_RATIO
+            # Report the object the scale was derived from, not merely the first detection.
+            best_reference = self._select_best_reference(reference_objects)
+            logger.info(f"參考物偵測結果: {len(reference_objects)} 個參考物")
+            if best_reference:
+                logger.info(f"最佳參考物: {best_reference['label']}, 信心度: {best_reference['confidence']:.2f}")
+            logger.info(f"像素比例: {pixel_ratio:.4f} cm/pixel")
+            # === Stage 3: weight estimation (SAM+DPT) ===
+            logger.info("--- 第三層：SAM+DPT 重量計算 ---")
+            weight_result = calculate_food_weight(
+                image_bytes=image_bytes,
+                food_name=food_name,
+                pixel_ratio=pixel_ratio,
+                bbox=None  # let the weight service use the whole image
+            )
+            if not weight_result.get("success", False):
+                logger.error("重量計算失敗")
+                return self._create_error_response("重量計算失敗", weight_result.get("error", "未知錯誤"))
+            estimated_weight = weight_result["estimated_weight"]
+            weight_confidence = weight_result["weight_confidence"]
+            weight_error_range = weight_result["weight_error_range"]
+            logger.info(f"重量計算結果: {estimated_weight}g, 信心度: {weight_confidence:.2f}")
+            # === Stage 4: nutrition lookup (USDA API) ===
+            logger.info("--- 第四層：USDA API 營養查詢 ---")
+            nutrition_info = fetch_nutrition_data(food_name)
+            data_source = "USDA API"
+            if nutrition_info is None:
+                logger.warning("USDA API 查詢失敗，使用預設營養值")
+                nutrition_info = self._get_default_nutrition(food_name)
+                # Do not label placeholder values as USDA data.
+                data_source = "default"
+            # === Stage 5: scale the per-100 g values by the estimated weight ===
+            logger.info("--- 第五層：重量調整營養素 ---")
+            weight_ratio = estimated_weight / 100  # nutrition values are per 100 g
+            adjusted_nutrition = self._adjust_nutrition(nutrition_info, weight_ratio)
+            logger.info(f"營養調整完成，重量比例: {weight_ratio:.2f}")
+            # === Assemble the report ===
+            analysis_time = (datetime.now() - start_time).total_seconds()
+            result = {
+                "success": True,
+                "analysis_time": round(analysis_time, 2),
+                "food_analysis": {
+                    "food_name": food_name,
+                    "recognition_method": "FOOD101",
+                    # NOTE(review): fixed placeholder, not a score returned by the classifier.
+                    "confidence": 0.95
+                },
+                "reference_analysis": {
+                    "detected_objects": reference_objects,
+                    "best_reference": best_reference,
+                    "pixel_ratio": pixel_ratio,
+                    "detection_method": "YOLO"
+                },
+                "weight_analysis": {
+                    "estimated_weight": estimated_weight,
+                    "weight_confidence": weight_confidence,
+                    "weight_error_range": weight_error_range,
+                    "calculation_method": "SAM+DPT",
+                    "reference_object": best_reference["label"] if best_reference else None
+                },
+                "nutrition_analysis": {
+                    "base_nutrition": nutrition_info,  # values per 100 g
+                    "adjusted_nutrition": adjusted_nutrition,  # values scaled to the estimated weight
+                    "data_source": data_source,
+                    "weight_ratio": weight_ratio
+                },
+                "summary": {
+                    "total_calories": adjusted_nutrition.get("calories", 0),
+                    "total_protein": adjusted_nutrition.get("protein", 0),
+                    "total_carbs": adjusted_nutrition.get("carbs", 0),
+                    "total_fat": adjusted_nutrition.get("fat", 0),
+                    "health_score": self._calculate_health_score(adjusted_nutrition)
+                },
+                "architecture": {
+                    "layer_1": "FOOD101 (食物識別)",
+                    "layer_2": "YOLO (參考物偵測)",
+                    "layer_3": "SAM+DPT (重量計算)",
+                    "layer_4": "USDA API (營養查詢)",
+                    "layer_5": "重量調整 (營養計算)"
+                }
+            }
+            logger.info("=== 整合食物分析完成 ===")
+            return result
+        except Exception as e:
+            # Top-level boundary: any unexpected failure becomes an error payload.
+            logger.error(f"整合食物分析失敗: {str(e)}")
+            return self._create_error_response("整合分析失敗", str(e))
+    def _select_best_reference(self, reference_objects: List[Dict[str, Any]]) -> Optional[Dict[str, Any]]:
+        """Return the first plate/bowl detection, else the first detection, else None."""
+        if not reference_objects:
+            return None
+        for candidate in reference_objects:
+            if any(priority in candidate["label"] for priority in self._PRIORITY_REFERENCE_LABELS):
+                return candidate
+        return reference_objects[0]
+    def _adjust_nutrition(self, nutrition_info: Dict[str, Any], weight_ratio: float) -> Dict[str, float]:
+        """Scale numeric per-100 g values by ``weight_ratio``; labels and non-numeric entries are skipped."""
+        adjusted = {}
+        for nutrient, value in nutrition_info.items():
+            if nutrient in self._NON_NUTRIENT_KEYS:
+                continue
+            # A missing or textual value must not abort the whole analysis.
+            if isinstance(value, bool) or not isinstance(value, (int, float, np.number)):
+                continue
+            adjusted[nutrient] = round(value * weight_ratio, 1)
+        return adjusted
+    def _create_error_response(self, error_type: str, error_message: str) -> Dict[str, Any]:
+        """Build the failure payload: ``success`` False, the error type/message and an ISO timestamp."""
+        return {
+            "success": False,
+            "error_type": error_type,
+            "error_message": error_message,
+            "timestamp": datetime.now().isoformat()
+        }
+    def _get_default_nutrition(self, food_name: str) -> Dict[str, Any]:
+        """Return fixed placeholder nutrition values, used when the USDA lookup returns None."""
+        return {
+            "food_name": food_name,
+            "calories": 100,
+            "protein": 5,
+            "fat": 2,
+            "carbs": 15,
+            "fiber": 2,
+            "sugar": 1,
+            "sodium": 200
+        }
+    def _calculate_health_score(self, nutrition: Dict[str, float]) -> int:
+        """
+        Score a nutrition dict from 0 to 100, starting at 100.
+        Penalties apply for high calories, fat and sodium and for low protein;
+        high protein earns a bonus. Missing entries count as 0.
+        """
+        score = 100
+        # Calories
+        calories = nutrition.get("calories", 0)
+        if calories > 400:
+            score -= 20
+        elif calories > 300:
+            score -= 10
+        # Fat
+        fat = nutrition.get("fat", 0)
+        if fat > 20:
+            score -= 15
+        elif fat > 15:
+            score -= 8
+        # Protein
+        protein = nutrition.get("protein", 0)
+        if protein > 15:
+            score += 10
+        elif protein < 5:
+            score -= 10
+        # Sodium
+        sodium = nutrition.get("sodium", 0)
+        if sodium > 800:
+            score -= 15
+        elif sodium > 600:
+            score -= 8
+        return max(0, min(100, score))
+# 全域服務實例
+integrated_service = IntegratedFoodAnalysisService()
+def analyze_food_image_integrated(image_bytes: bytes, debug: bool = False) -> Dict[str, Any]:
+    """
+    Module-level entry point that delegates to the shared service instance.
+    Args:
+        image_bytes: Raw bytes of the image.
+        debug: Forwarded unchanged to the service.
+    Returns:
+        Dict: Whatever ``integrated_service.analyze_food_image`` returns.
+    """
+    analysis_report = integrated_service.analyze_food_image(image_bytes=image_bytes, debug=debug)
+    return analysis_report

app/services/nutrition_api_service.py CHANGED Viewed

@@ -12,7 +12,7 @@ logger = logging.getLogger(__name__)
 load_dotenv()
 # 從環境變數中獲取 API 金鑰
-USDA_API_KEY = os.getenv("USDA_API_KEY", "DEMO_KEY")
 USDA_API_URL = "https://api.nal.usda.gov/fdc/v1/foods/search"
 # 我們關心的主要營養素及其在 USDA API 中的名稱或編號

 load_dotenv()
 # 從環境變數中獲取 API 金鑰
+# The fallback must never be a real credential: source files are public.
+# NOTE(review): the key previously committed on this line should be revoked and set via the USDA_API_KEY environment variable.
+USDA_API_KEY = os.getenv("USDA_API_KEY", "DEMO_KEY")
 USDA_API_URL = "https://api.nal.usda.gov/fdc/v1/foods/search"
 # 我們關心的主要營養素及其在 USDA API 中的名稱或編號

app/services/reference_detection_service.py ADDED Viewed

	@@ -0,0 +1,198 @@

+# 檔案路徑: app/services/reference_detection_service.py
+import logging
+import numpy as np
+from PIL import Image
+from typing import Dict, Any, List, Optional, Tuple
+from ultralytics import YOLO
+import io
+# 設置日誌
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+# Real-world sizes of reference objects, in cm.
+# Looked up by ReferenceDetectionService._get_reference_dimensions; "default" is its fallback entry.
+REFERENCE_OBJECTS = {
+    "plate": {"diameter": 24.0, "type": "circular"},      # standard dinner plate diameter
+    "bowl": {"diameter": 15.0, "type": "circular"},       # standard bowl diameter
+    "spoon": {"length": 15.0, "type": "linear"},          # spoon length
+    "fork": {"length": 20.0, "type": "linear"},           # fork length
+    "knife": {"length": 20.0, "type": "linear"},          # knife length
+    "coin": {"diameter": 2.4, "type": "circular"},        # coin diameter
+    "credit_card": {"length": 8.5, "width": 5.4, "type": "rectangular"},  # credit card
+    "default": {"diameter": 24.0, "type": "circular"}     # fallback reference object
+}
+class ReferenceDetectionService:
+    """Detects known-size objects with YOLO and derives an image scale (cm/pixel) from them."""
+    def __init__(self):
+        """Create the service and load the YOLO model immediately."""
+        self.yolo_model = None
+        self._load_model()
+    def _load_model(self):
+        """Load the YOLOv8n weights; a load failure is logged and re-raised."""
+        try:
+            logger.info("正在載入 YOLO 參考物偵測模型...")
+            # YOLOv8n is used as the base model.
+            self.yolo_model = YOLO("yolov8n.pt")
+            logger.info("YOLO 模型載入完成！")
+        except Exception as e:
+            logger.error(f"YOLO 模型載入失敗: {str(e)}")
+            raise
+    def detect_reference_objects(self, image: "Image.Image") -> List[Dict[str, Any]]:
+        """
+        Detect reference objects in an image with YOLO.
+        Args:
+            image: PIL image to analyse.
+        Returns:
+            List[Dict]: One dict per accepted detection (label, bbox, confidence,
+            pixel area, real-world dimensions), sorted by confidence, highest
+            first. Empty when nothing is found or detection fails.
+        """
+        try:
+            results = self.yolo_model(image)
+            reference_objects = []
+            for x1, y1, x2, y2, conf, class_id in results[0].boxes.data.tolist():
+                label = self.yolo_model.model.names[int(class_id)].lower()
+                # Keep only reference-type classes detected with confidence above 0.3.
+                if not (self._is_reference_object(label) and conf > 0.3):
+                    continue
+                reference_objects.append({
+                    "label": label,
+                    "bbox": [x1, y1, x2, y2],
+                    "confidence": conf,
+                    "area": (x2 - x1) * (y2 - y1),  # bounding-box area in pixels
+                    "dimensions": self._get_reference_dimensions(label)
+                })
+            # Highest-confidence detections first.
+            reference_objects.sort(key=lambda x: x["confidence"], reverse=True)
+            logger.info(f"偵測到 {len(reference_objects)} 個參考物: {[obj['label'] for obj in reference_objects]}")
+            return reference_objects
+        except Exception as e:
+            logger.error(f"參考物偵測失敗: {str(e)}")
+            return []
+    def _is_reference_object(self, label: str) -> bool:
+        """Return True when the label contains one of the accepted reference keywords."""
+        # NOTE(review): "card", "phone" and "remote" have no entry in REFERENCE_OBJECTS,
+        # so such detections are measured with the "default" (24 cm circular) size - confirm intent.
+        reference_labels = [
+            "plate", "bowl", "spoon", "fork", "knife",
+            "coin", "credit card", "card", "phone", "remote"
+        ]
+        return any(ref_label in label for ref_label in reference_labels)
+    def _get_reference_dimensions(self, label: str) -> Dict[str, Any]:
+        """Return the real-world dimensions for a label, or the "default" entry when none matches."""
+        # Table keys use underscores ("credit_card") while detector labels use
+        # spaces ("credit card"); normalise so multi-word keys can match.
+        normalized_label = label.replace(" ", "_")
+        for ref_name, dimensions in REFERENCE_OBJECTS.items():
+            if ref_name in normalized_label:
+                return dimensions
+        return REFERENCE_OBJECTS["default"]
+    def calculate_pixel_ratio(self, reference_object: Dict[str, Any]) -> float:
+        """
+        Derive the image scale from one reference object.
+        Args:
+            reference_object: Detection dict holding "bbox", "dimensions" and "label".
+        Returns:
+            float: Scale in cm/pixel; 0.01 when the shape type is unknown or the
+            computation fails (for example a bounding box with no extent).
+        """
+        try:
+            x1, y1, x2, y2 = reference_object["bbox"]
+            dimensions = reference_object["dimensions"]
+            # Size of the reference object in the image, in pixels.
+            pixel_width = x2 - x1
+            pixel_height = y2 - y1
+            shape_type = dimensions["type"]
+            if shape_type == "circular":
+                # Circular objects (plate, bowl, coin): the shorter box side is taken as the diameter.
+                pixel_extent = min(pixel_width, pixel_height)
+                actual_extent = dimensions["diameter"]
+            elif shape_type in ("linear", "rectangular"):
+                # Cutlery and cards: the longer box side is taken as the length.
+                pixel_extent = max(pixel_width, pixel_height)
+                actual_extent = dimensions["length"]
+            else:
+                pixel_extent = actual_extent = None
+            if pixel_extent is None:
+                pixel_ratio = 0.01  # fallback scale: 100 pixels = 1 cm
+            elif pixel_extent <= 0:
+                # A degenerate box would give a division by zero or a negative scale.
+                raise ValueError("reference bounding box has no positive extent")
+            else:
+                pixel_ratio = actual_extent / pixel_extent
+            logger.info(f"參考物 {reference_object['label']} 像素比例: {pixel_ratio:.4f} cm/pixel")
+            return pixel_ratio
+        except Exception as e:
+            logger.error(f"計算像素比例失敗: {str(e)}")
+            return 0.01  # fallback scale
+    def get_best_reference_object(self, reference_objects: List[Dict[str, Any]]) -> Optional[Dict[str, Any]]:
+        """
+        Choose the reference object to derive the scale from.
+        Args:
+            reference_objects: Detections, expected in descending confidence order.
+        Returns:
+            Optional[Dict]: The first plate or bowl if any, otherwise the first
+            detection; None when the list is empty.
+        """
+        if not reference_objects:
+            return None
+        # Plates and bowls are preferred (the original author considers them the most stable).
+        priority_objects = ["plate", "bowl"]
+        for obj in reference_objects:
+            if any(priority in obj["label"] for priority in priority_objects):
+                return obj
+        # No priority object: fall back to the first (highest-confidence) detection.
+        return reference_objects[0]
+# 全域服務實例
+reference_service = ReferenceDetectionService()
+def detect_reference_objects_from_image(image_bytes: bytes) -> Tuple[List[Dict[str, Any]], Optional[float]]:
+    """
+    Detect reference objects in raw image bytes and derive the image scale.
+    Args:
+        image_bytes: Raw bytes of the image.
+    Returns:
+        Tuple[List[Dict], Optional[float]]: (detections, cm/pixel scale). The
+        scale is None when no reference object is chosen; on any error the
+        result is ([], None).
+    """
+    try:
+        rgb_image = Image.open(io.BytesIO(image_bytes)).convert("RGB")
+        # Detect, then pick the object the scale is derived from.
+        detections = reference_service.detect_reference_objects(rgb_image)
+        chosen = reference_service.get_best_reference_object(detections)
+        if chosen:
+            return detections, reference_service.calculate_pixel_ratio(chosen)
+        return detections, None
+    except Exception as exc:
+        logger.error(f"參考物偵測失敗: {str(exc)}")
+        return [], None

app/services/weight_calculation_service.py ADDED Viewed

	@@ -0,0 +1,309 @@

+# 檔案路徑: app/services/weight_calculation_service.py
+import logging
+import numpy as np
+from PIL import Image
+import io
+from typing import Dict, Any, List, Optional, Tuple
+import torch
+from transformers import SamModel, SamProcessor, pipeline
+# 設置日誌
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+# Food density table (g/cm³) - average densities of common foods.
+# Keys are matched as substrings of the lower-cased food name; "default" is the fallback.
+FOOD_DENSITY_TABLE = {
+    "rice": 0.8,           # cooked rice
+    "fried_rice": 0.7,     # fried rice
+    "noodles": 0.6,        # noodles
+    "bread": 0.3,          # bread
+    "meat": 1.0,           # meat
+    "fish": 1.1,           # fish
+    "vegetables": 0.4,     # vegetables
+    "fruits": 0.8,         # fruit
+    "soup": 1.0,           # soup
+    "sushi": 0.9,          # sushi
+    "pizza": 0.6,          # pizza
+    "hamburger": 0.7,      # hamburger
+    "salad": 0.3,          # salad
+    "default": 0.8         # fallback density
+}
+class WeightCalculationService:
+    """Estimates the weight of food in a single image from SAM segmentation and DPT depth."""
+    def __init__(self):
+        """Create the service and load the SAM and DPT models immediately."""
+        self.sam_model = None
+        self.sam_processor = None
+        self.dpt_model = None
+        self._load_models()
+    def _load_models(self):
+        """Load the SAM and DPT models; a load failure is logged and re-raised."""
+        try:
+            # SAM segmentation model
+            logger.info("正在載入 SAM 分割模型...")
+            self.sam_model = SamModel.from_pretrained("facebook/sam-vit-base")
+            self.sam_processor = SamProcessor.from_pretrained("facebook/sam-vit-base")
+            # DPT depth-estimation model
+            logger.info("正在載入 DPT 深度估計模型...")
+            self.dpt_model = pipeline("depth-estimation", model="Intel/dpt-large")
+            logger.info("SAM 和 DPT 模型載入完成！")
+        except Exception as e:
+            logger.error(f"模型載入失敗: {str(e)}")
+            raise
+    def segment_food_area(self, image: "Image.Image", bbox: List[float]) -> np.ndarray:
+        """
+        Segment the food region inside a bounding box with SAM.
+        Args:
+            image: PIL image to segment.
+            bbox: Bounding box [x1, y1, x2, y2] in pixels.
+        Returns:
+            np.ndarray: Boolean mask of shape (height, width); an all-True mask
+            when segmentation fails.
+        """
+        try:
+            # SamProcessor requires boxes nested as [image][box][x1, y1, x2, y2].
+            box = [float(value) for value in bbox]
+            inputs = self.sam_processor(image, input_boxes=[[box]], return_tensors="pt")
+            with torch.no_grad():
+                outputs = self.sam_model(**inputs)
+            # post_process_masks thresholds raw logits itself; applying sigmoid
+            # first would push every pixel above its 0.0 threshold.
+            masks_tensor = self.sam_processor.image_processor.post_process_masks(
+                outputs.pred_masks.cpu(),
+                inputs["original_sizes"].cpu(),
+                inputs["reshaped_input_sizes"].cpu()
+            )[0]
+            # SAM proposes several candidate masks per box; keep the one it scores highest.
+            best_index = int(outputs.iou_scores[0, 0].argmax())
+            mask = masks_tensor[0, best_index].cpu().numpy().astype(bool)
+            logger.info(f"SAM 分割完成，遮罩大小: {mask.shape}")
+            return mask
+        except Exception as e:
+            logger.error(f"SAM 分割失敗: {str(e)}")
+            # Fallback: treat the whole image as food.
+            return np.ones((image.height, image.width), dtype=bool)
+    def estimate_depth(self, image: "Image.Image") -> np.ndarray:
+        """
+        Estimate a depth map with DPT.
+        Args:
+            image: PIL image to analyse.
+        Returns:
+            np.ndarray: Float depth map scaled to [0, 1]; an all-ones map of
+            shape (height, width) when estimation fails.
+        """
+        try:
+            depth_result = self.dpt_model(image)
+            # The pipeline's "depth" entry is a PIL image, which has no .shape:
+            # convert to an array before inspecting it.
+            depth_map = np.asarray(depth_result["depth"], dtype=np.float32)
+            # NOTE(review): scaled to [0, 1] because the variance thresholds in
+            # _calculate_confidence and the all-ones fallback presumably assume a unit range - confirm.
+            peak = float(depth_map.max()) if depth_map.size else 0.0
+            if peak > 0:
+                depth_map = depth_map / peak
+            logger.info(f"DPT 深度估計完成，深度圖大小: {depth_map.shape}")
+            return depth_map
+        except Exception as e:
+            logger.error(f"DPT 深度估計失敗: {str(e)}")
+            # Fallback: flat depth map.
+            return np.ones((image.height, image.width))
+    def calculate_volume_and_weight(self,
+                                  mask: np.ndarray,
+                                  depth_map: np.ndarray,
+                                  food_name: str,
+                                  pixel_ratio: float) -> Tuple[float, float, float]:
+        """
+        Estimate weight from the segmented area, depth statistics and food density.
+        Args:
+            mask: Boolean mask of the food region.
+            depth_map: Depth map with the same shape as ``mask``.
+            food_name: Food name used for the density lookup.
+            pixel_ratio: Image scale in cm/pixel.
+        Returns:
+            Tuple[float, float, float]: (weight in g, confidence, relative error).
+            (150.0, 0.3, 0.5) when the computation fails.
+        """
+        try:
+            # Number of pixels covered by the food mask.
+            food_pixels = int(np.sum(mask))
+            logger.info(f"重量計算開始 - 食物: {food_name}, 像素數量: {food_pixels}")
+            # Mean and variance of the depth inside the food region.
+            food_depth_values = depth_map[mask]
+            if len(food_depth_values) > 0:
+                food_depth = float(np.mean(food_depth_values))
+                depth_variance = float(np.var(food_depth_values))
+            else:
+                food_depth = 1.0
+                depth_variance = 0.0
+            logger.info(f"深度分析 - 平均深度: {food_depth:.4f}, 深度變異: {depth_variance:.4f}")
+            # Real-world area in cm².
+            area_cm2 = food_pixels * (pixel_ratio ** 2)
+            logger.info(f"面積計算 - 像素比例: {pixel_ratio:.4f}, 實際面積: {area_cm2:.2f} cm²")
+            # Shape factor heuristic driven by the depth statistics.
+            if depth_variance > 0:
+                # Varying depth is taken to mean a more three-dimensional food.
+                shape_factor = np.clip(0.6 + (depth_variance * 0.2), 0.3, 0.8)
+            else:
+                # Uniform depth is taken to mean a flatter food.
+                shape_factor = np.clip(0.4 + (food_depth * 0.2), 0.2, 0.7)
+            logger.info(f"形狀因子 - 動態調整: {shape_factor:.4f}")
+            # Volume in cm³ from the area raised to the 3/2 power.
+            volume_cm3 = shape_factor * (area_cm2 ** 1.5)
+            logger.info(f"體積計算 - 估算體積: {volume_cm3:.2f} cm³")
+            density = self._get_food_density(food_name)
+            logger.info(f"密度查詢 - 食物: {food_name}, 密度: {density} g/cm³")
+            # Weight in g.
+            weight = volume_cm3 * density
+            logger.info(f"重量計算 - 原始重量: {weight:.2f} g")
+            # Plausibility clamp to the 10 g .. 2 kg range.
+            if weight > 2000:
+                logger.warning(f"重量 {weight:.2f}g 過高，進行調整")
+                weight = 2000
+            elif weight < 10:
+                logger.warning(f"重量 {weight:.2f}g 過低，進行調整")
+                weight = 10
+            confidence = self._calculate_confidence(pixel_ratio, depth_variance, food_pixels)
+            error_range = self._calculate_error_range(confidence)
+            logger.info(f"最終結果 - 重量: {weight:.2f}g, 信心度: {confidence:.2f}, 誤差範圍: ±{error_range*100:.1f}%")
+            # Plain floats keep NumPy scalar types out of the API response.
+            return float(weight), float(confidence), float(error_range)
+        except Exception as e:
+            logger.error(f"重量計算失敗: {str(e)}")
+            return 150.0, 0.3, 0.5  # fallback values
+    def _get_food_density(self, food_name: str) -> float:
+        """Return the density (g/cm³) of the most specific table keyword found in the food name."""
+        # Table keys use underscores, so normalise spaces before matching.
+        normalized_name = food_name.lower().replace(" ", "_")
+        matches = [
+            keyword for keyword in FOOD_DENSITY_TABLE
+            if keyword != "default" and keyword in normalized_name
+        ]
+        if matches:
+            # The longest keyword wins so that "fried_rice" is not shadowed by "rice".
+            return FOOD_DENSITY_TABLE[max(matches, key=len)]
+        return FOOD_DENSITY_TABLE["default"]
+    def _calculate_confidence(self, pixel_ratio: float, depth_variance: float, food_pixels: int) -> float:
+        """Heuristic confidence in [0.1, 0.95] from the scale, depth variance and mask size."""
+        # Base confidence.
+        base_confidence = 0.6
+        # Scale: a plausible cm/pixel ratio raises confidence.
+        if 0.005 <= pixel_ratio <= 0.05:
+            base_confidence += 0.2
+        elif 0.001 <= pixel_ratio <= 0.1:
+            base_confidence += 0.1
+        # Depth variance: moderate variance raises confidence, large variance lowers it.
+        if 0.01 <= depth_variance <= 0.1:
+            base_confidence += 0.1
+        elif depth_variance > 0.5:
+            base_confidence -= 0.1
+        # Mask size: a moderate pixel count raises confidence, a tiny one lowers it.
+        if 1000 <= food_pixels <= 100000:
+            base_confidence += 0.1
+        elif food_pixels < 100:
+            base_confidence -= 0.2
+        return float(np.clip(base_confidence, 0.1, 0.95))
+    def _calculate_error_range(self, confidence: float) -> float:
+        """Map confidence to a relative error: the higher the confidence, the narrower the range."""
+        if confidence >= 0.8:
+            return 0.1  # ±10%
+        elif confidence >= 0.6:
+            return 0.2  # ±20%
+        elif confidence >= 0.4:
+            return 0.3  # ±30%
+        else:
+            return 0.5  # ±50%
+# 全域服務實例
+weight_calculation_service = WeightCalculationService()
+def calculate_food_weight(image_bytes: bytes,
+                         food_name: str,
+                         pixel_ratio: float,
+                         bbox: Optional[List[float]] = None) -> Dict[str, Any]:
+    """
+    Entry point for estimating the weight of the food in an image.
+    Args:
+        image_bytes: Raw bytes of the image.
+        food_name: Name of the food.
+        pixel_ratio: Image scale passed on to the weight computation.
+        bbox: Optional bounding box; the whole image is used when omitted.
+    Returns:
+        Dict: Weight, confidence and error range with ``success`` True, or
+        fixed fallback values with ``success`` False and an ``error`` message.
+    """
+    try:
+        rgb_image = Image.open(io.BytesIO(image_bytes)).convert("RGB")
+        # Without a box, cover the full image.
+        bbox = [0, 0, rgb_image.width, rgb_image.height] if bbox is None else bbox
+        logger.info(f"開始計算 {food_name} 的重量，使用邊界框: {bbox}")
+        # 1. SAM segmentation of the food region, 2. DPT depth map.
+        food_mask = weight_calculation_service.segment_food_area(rgb_image, bbox)
+        depth = weight_calculation_service.estimate_depth(rgb_image)
+        # 3. Volume and weight.
+        grams, confidence, relative_error = weight_calculation_service.calculate_volume_and_weight(
+            food_mask, depth, food_name, pixel_ratio
+        )
+        # 4. Lower and upper bounds of the estimate.
+        lower_bound = grams * (1 - relative_error)
+        upper_bound = grams * (1 + relative_error)
+        report = {
+            "food_name": food_name,
+            "estimated_weight": round(grams, 1),
+            "weight_confidence": confidence,
+            "weight_error_range": [round(lower_bound, 1), round(upper_bound, 1)],
+            "pixel_ratio": pixel_ratio,
+            "calculation_method": "SAM+DPT",
+            "success": True
+        }
+        return report
+    except Exception as exc:
+        logger.error(f"重量計算主流程失敗: {str(exc)}")
+        fallback = {
+            "food_name": food_name,
+            "estimated_weight": 150.0,
+            "weight_confidence": 0.3,
+            "weight_error_range": [100.0, 200.0],
+            "pixel_ratio": pixel_ratio,
+            "calculation_method": "SAM+DPT",
+            "success": False,
+            "error": str(exc)
+        }
+        return fallback

app/services/weight_estimation_service.py CHANGED Viewed

@@ -6,6 +6,7 @@ from PIL import Image
 import io
 from typing import Dict, Any, List, Optional, Tuple
 import torch
 # 設置日誌
 logging.basicConfig(level=logging.INFO)
@@ -55,10 +56,10 @@ class WeightEstimationService:
             from transformers import pipeline
             logger.info("正在載入 DPT 深度估計模型...")
             self.dpt_model = pipeline("depth-estimation", model="Intel/dpt-large")
-            # 載入物件偵測模型（用於偵測參考物）
-            logger.info("正在載入物件偵測模型...")
-            self.detection_model = pipeline("object-detection", model="ultralytics/yolov5")
             logger.info("所有模型載入完成！")
@@ -66,61 +67,51 @@ class WeightEstimationService:
             logger.error(f"模型載入失敗: {str(e)}")
             raise
-    def detect_reference_objects(self, image: Image.Image) -> Optional[Dict[str, Any]]:
-        """偵測圖片中的參考物（餐盤、餐具等）"""
         try:
-            # 使用 YOLOv5 偵測物件
             results = self.detection_model(image)
-            reference_objects = []
-            for result in results:
-                label = result["label"].lower()
-                confidence = result["score"]
-                # 檢查是否為參考物
-                if any(ref in label for ref in ["plate", "bowl", "spoon", "fork", "knife"]):
-                    reference_objects.append({
-                        "type": label,
-                        "confidence": confidence,
-                        "bbox": result["box"]
                     })
-            if reference_objects:
-                # 選擇信心度最高的參考物
-                best_ref = max(reference_objects, key=lambda x: x["confidence"])
-                return best_ref
-            return None
         except Exception as e:
-            logger.warning(f"參考物偵測失敗: {str(e)}")
-            return None
-    def segment_food(self, image: Image.Image) -> np.ndarray:
-        """使用 SAM 分割食物區域"""
         try:
-            # 使用 SAM 進行分割
-            inputs = self.sam_processor(image, return_tensors="pt")
             with torch.no_grad():
                 outputs = self.sam_model(**inputs)
             # 取得分割遮罩
-            masks = self.sam_processor.image_processor.post_process_masks(
                 outputs.pred_masks.sigmoid(),
                 inputs["original_sizes"],
                 inputs["reshaped_input_sizes"]
             )[0]
-            # 選擇最大的遮罩作為食物區域
-            mask = masks[0].numpy()  # 簡化處理，選擇第一個遮罩
-            return mask
         except Exception as e:
             logger.error(f"食物分割失敗: {str(e)}")
-            # 回傳一個簡單的遮罩（整個圖片）
-            return np.ones((image.height, image.width), dtype=bool)
     def estimate_depth(self, image: Image.Image) -> np.ndarray:
         """使用 DPT 進行深度估計"""
@@ -154,7 +145,7 @@ class WeightEstimationService:
             # 如果有參考物，進行尺寸校正
             if reference_object:
-                ref_type = reference_object["type"]
                 if ref_type in REFERENCE_OBJECTS:
                     ref_size = REFERENCE_OBJECTS[ref_type]
                     # 根據參考物尺寸校正體積
@@ -180,11 +171,15 @@ class WeightEstimationService:
                 error_range = 0.4  # ±40% 誤差
             # 根據食物類型取得密度
-            density = FOOD_DENSITY_TABLE.get(food_type.lower(), FOOD_DENSITY_TABLE["default"])
             # 計算重量 (g)
             weight = actual_volume * density
             return weight, confidence, error_range
         except Exception as e:
@@ -200,7 +195,7 @@ class WeightEstimationService:
             return FOOD_DENSITY_TABLE["rice"]
         elif any(keyword in food_name_lower for keyword in ["noodle", "麵"]):
             return FOOD_DENSITY_TABLE["noodles"]
-        elif any(keyword in food_name_lower for keyword in ["meat", "肉"]):
             return FOOD_DENSITY_TABLE["meat"]
         elif any(keyword in food_name_lower for keyword in ["vegetable", "菜"]):
             return FOOD_DENSITY_TABLE["vegetables"]
@@ -210,87 +205,156 @@ class WeightEstimationService:
 # 全域服務實例
 weight_service = WeightEstimationService()
-async def estimate_food_weight(image_bytes: bytes) -> Dict[str, Any]:
     """
-    整合食物辨識、重量估算與營養分析的主函數
     """
     try:
         # 將 bytes 轉換為 PIL Image
-        image = Image.open(io.BytesIO(image_bytes))
-        # 1. 食物辨識（使用現有的 AI 服務）
-        from .ai_service import classify_food_image
-        food_name = classify_food_image(image_bytes)
-        # 2. 偵測參考物
-        reference_object = weight_service.detect_reference_objects(image)
-        # 3. 食物分割
-        food_mask = weight_service.segment_food(image)
-        # 4. 深度估計
         depth_map = weight_service.estimate_depth(image)
-        # 5. 計算體積和重量
-        weight, confidence, error_range = weight_service.calculate_volume_and_weight(
-            food_mask, depth_map, food_name, reference_object
-        )
-        # 6. 查詢營養資訊
         from .nutrition_api_service import fetch_nutrition_data
-        nutrition_info = fetch_nutrition_data(food_name)
-        if nutrition_info is None:
-            nutrition_info = {
-                "calories": 150,
-                "protein": 5,
-                "carbs": 25,
-                "fat": 3,
-                "fiber": 2
-            }
-        # 7. 根據重量調整營養素
-        weight_ratio = weight / 100  # 假設營養資訊是每100g的數據
-        adjusted_nutrition = {
-            key: value * weight_ratio
-            for key, value in nutrition_info.items()
-        }
-        # 8. 計算誤差範圍
-        error_min = weight * (1 - error_range)
-        error_max = weight * (1 + error_range)
-        # 9. 生成備註
         if reference_object:
-            note = f"檢測到參考物：{reference_object['type']}，準確度較高"
         else:
-            note = "未檢測到參考物，重量為估算值，僅供參考"
-        return {
-            "food_type": food_name,
-            "estimated_weight": round(weight, 1),
-            "weight_confidence": round(confidence, 2),
-            "weight_error_range": [round(error_min, 1), round(error_max, 1)],
-            "nutrition": adjusted_nutrition,
-            "reference_object": reference_object["type"] if reference_object else None,
             "note": note
         }
     except Exception as e:
-        logger.error(f"重量估算失敗: {str(e)}")
-        # 回傳預設結果
-        return {
-            "food_type": "Unknown",
-            "estimated_weight": 150.0,
-            "weight_confidence": 0.3,
-            "weight_error_range": [100.0, 200.0],
-            "nutrition": {
-                "calories": 150,
-                "protein": 5,
-                "carbs": 25,
-                "fat": 3,
-                "fiber": 2
-            },
             "reference_object": None,
-            "note": "分析失敗，顯示預設值"
-        }

 import io
 from typing import Dict, Any, List, Optional, Tuple
 import torch
+from ultralytics import YOLO
 # 設置日誌
 logging.basicConfig(level=logging.INFO)
             from transformers import pipeline
             logger.info("正在載入 DPT 深度估計模型...")
             self.dpt_model = pipeline("depth-estimation", model="Intel/dpt-large")
+            # 載入 YOLOv8 物件偵測模型（用於偵測參考物）
+            logger.info("正在載入 YOLOv8 物件偵測模型...")
+            self.detection_model = YOLO("yolov8n.pt")  # 你可以改成 yolov5s.pt 或自訂模型
             logger.info("所有模型載入完成！")
             logger.error(f"模型載入失敗: {str(e)}")
             raise
+    def detect_objects(self, image: Image.Image) -> List[Dict[str, Any]]:
+        """
+        Run the YOLOv8 detector and return the detections worth keeping.
+
+        A detection is kept when its confidence is above 0.4 and its
+        lower-cased label is not one of the listed utensils.
+
+        Returns:
+            A list of dicts with "label", "bbox" ([x1, y1, x2, y2]) and
+            "confidence"; an empty list if detection raises.
+        """
+        skipped_labels = ["spoon", "fork", "knife", "scissors"]
          try:
+            predictions = self.detection_model(image)
+            kept = []
+            # Each row of the first result's box data unpacks to two corner
+            # points, a confidence score and a class index.
+            for x1, y1, x2, y2, conf, class_id in predictions[0].boxes.data.tolist():
+                label = self.detection_model.model.names[int(class_id)].lower()
+                if not conf > 0.4 or label in skipped_labels:
+                    continue
+                kept.append({
+                    "label": label,
+                    "bbox": [x1, y1, x2, y2],
+                    "confidence": conf
+                })
+            return kept
          except Exception as e:
+            logger.warning(f"物件偵測失敗: {str(e)}")
+            return []
+    def segment_food(self, image: Image.Image, input_boxes: List[List[float]]) -> List[np.ndarray]:
+        """
+        Segment one region per bounding box using SAM.
+
+        Args:
+            image: Image to segment.
+            input_boxes: Box prompts for this image, one list of four
+                coordinates per object (callers pass the detector's
+                [x1, y1, x2, y2] boxes).
+
+        Returns:
+            One boolean 2-D mask per input box (the candidate with the
+            highest predicted IoU), or an empty list when no boxes are
+            given or segmentation fails.
+        """
+        if not input_boxes:
+            return []
          try:
+            # The boxes are wrapped in one more list: the processor takes
+            # one list of boxes per image.
+            inputs = self.sam_processor(image, input_boxes=[input_boxes], return_tensors="pt")
              with torch.no_grad():
                  outputs = self.sam_model(**inputs)
+            # post_process_masks binarises by thresholding the raw mask
+            # logits at 0, so the logits are passed untouched. Sigmoid output
+            # is always above 0 and would mark every pixel as foreground.
+            masks_tensor = self.sam_processor.image_processor.post_process_masks(
+                outputs.pred_masks.cpu(),
                  inputs["original_sizes"],
                  inputs["reshaped_input_sizes"]
              )[0]
+            # Per the transformers SAM docs, masks_tensor is laid out as
+            # (num_boxes, num_candidates, H, W) and iou_scores[0] as
+            # (num_boxes, num_candidates). Keep the best-scoring candidate
+            # for each box so every returned mask is a plain 2-D array.
+            best_candidate = outputs.iou_scores[0].argmax(dim=-1)
+            masks = [
+                box_masks[int(idx)].cpu().numpy().astype(bool)
+                for box_masks, idx in zip(masks_tensor, best_candidate)
+            ]
+            return masks
          except Exception as e:
              logger.error(f"食物分割失敗: {str(e)}")
+            return []
     def estimate_depth(self, image: Image.Image) -> np.ndarray:
         """使用 DPT 進行深度估計"""
             # 如果有參考物，進行尺寸校正
             if reference_object:
+                ref_type = reference_object["label"] # Changed from "type" to "label"
                 if ref_type in REFERENCE_OBJECTS:
                     ref_size = REFERENCE_OBJECTS[ref_type]
                     # 根據參考物尺寸校正體積
                 error_range = 0.4  # ±40% 誤差
             # 根據食物類型取得密度
+            density = self.get_food_density(food_type)
             # 計算重量 (g)
             weight = actual_volume * density
+            # 對單一物件的重量做一個合理性檢查
+            if weight > 1500: # > 1.5kg
+                logger.warning(f"單一物件預估重量 {weight:.2f}g 過高，可能不準確。")
             return weight, confidence, error_range
         except Exception as e:
             return FOOD_DENSITY_TABLE["rice"]
         elif any(keyword in food_name_lower for keyword in ["noodle", "麵"]):
             return FOOD_DENSITY_TABLE["noodles"]
+        elif any(keyword in food_name_lower for keyword in ["meat", "肉", "chicken", "pork", "beef", "lamb"]):
             return FOOD_DENSITY_TABLE["meat"]
         elif any(keyword in food_name_lower for keyword in ["vegetable", "菜"]):
             return FOOD_DENSITY_TABLE["vegetables"]
 # 全域服務實例
 weight_service = WeightEstimationService()
+async def estimate_food_weight(image_bytes: bytes, debug: bool = False) -> Dict[str, Any]:
     """
+    Detect, segment, classify and weigh every food item in an image.
+
+    Pipeline: object detection (YOLO) -> one depth map (DPT) -> for each
+    detected non-plate/bowl object: box-prompted SAM segmentation, food
+    classification on the masked crop, volume/weight estimation and a
+    nutrition lookup scaled by weight / 100.
+
+    Args:
+        image_bytes: Raw bytes of the encoded image.
+        debug: When True, intermediate images are written to
+            debug_output/<timestamp>/ and that path is added to the result
+            under "debug_output_path".
+
+    Returns:
+        Dict with "detected_foods", "total_estimated_weight",
+        "total_nutrition", "reference_object" and "note". Failures are
+        logged and reported through "note"; no exception is propagated.
     """
+    debug_dir = None
     try:
+        if debug:
+            import os
+            from datetime import datetime
+            timestamp = datetime.now().strftime("%Y%m%d_%H%M%S_%f")
+            debug_dir = os.path.join("debug_output", timestamp)
+            os.makedirs(debug_dir, exist_ok=True)
         # Decode the bytes into an RGB PIL image.
+        image = Image.open(io.BytesIO(image_bytes)).convert("RGB")
+        if debug:
+            image.save(os.path.join(debug_dir, "00_original.jpg"))
+        # 1. Object detection (YOLO): collect the bounding boxes of all objects.
+        all_objects = weight_service.detect_objects(image)
+        if not all_objects:
+            note = "無法從圖片中偵測到任何物體。"
+            # Carries the same keys as the success and error payloads,
+            # including "reference_object".
+            result = {"detected_foods": [], "total_estimated_weight": 0, "total_nutrition": {}, "reference_object": None, "note": note}
+            if debug: result["debug_output_path"] = debug_dir
+            return result
+        if debug:
+            from PIL import ImageDraw
+            debug_image = image.copy()
+            draw = ImageDraw.Draw(debug_image)
+            for obj in all_objects:
+                bbox = obj.get("bbox")
+                label = obj.get("label", "unknown")
+                draw.rectangle(bbox, outline="red", width=3)
+                draw.text((bbox[0], bbox[1]), label, fill="red")
+            debug_image.save(os.path.join(debug_dir, "01_detected_objects.jpg"))
+        # 2. Pick a reference object (plate or bowl): the most confident one, if any.
+        reference_objects = [obj for obj in all_objects if obj["label"] in ["plate", "bowl"]]
+        reference_object = max(reference_objects, key=lambda x: x["confidence"]) if reference_objects else None
+        # 3. Depth estimation (DPT); computed once and shared by every item.
         depth_map = weight_service.estimate_depth(image)
+        if debug:
+            # Min-max normalise to 0..255 for saving; the 1e-6 avoids a
+            # division by zero on a constant depth map.
+            depth_for_save = (depth_map - np.min(depth_map)) / (np.max(depth_map) - np.min(depth_map) + 1e-6) * 255.0
+            Image.fromarray(depth_for_save.astype(np.uint8)).convert("L").save(os.path.join(debug_dir, "03_depth_map.png"))
+        # Load the sibling services used below.
+        from .ai_service import classify_food_image
         from .nutrition_api_service import fetch_nutrition_data
+        detected_foods = []
+        total_nutrition = {"calories": 0, "protein": 0, "carbs": 0, "fat": 0, "fiber": 0}
+        # 4. Process every detected object (YOLO box) that is not a plate or bowl.
+        food_objects = [obj for obj in all_objects if obj["label"] not in ["plate", "bowl"]]
+        for i, food_obj in enumerate(food_objects):
+            try:
+                # a. Prompt SAM with the object's bounding box.
+                input_box = [food_obj["bbox"]]
+                masks = weight_service.segment_food(image, input_boxes=input_box)
+                if not masks: continue
+                # Of the masks returned, keep the one covering the most pixels.
+                mask = max(masks, key=lambda m: np.sum(m))
+                # b. Crop the single food item out of the image using the mask
+                #    (this crop is what the classifier sees).
+                rows, cols = np.any(mask, axis=1), np.any(mask, axis=0)
+                if not np.any(rows) or not np.any(cols): continue
+                rmin, rmax = np.where(rows)[0][[0, -1]]
+                cmin, cmax = np.where(cols)[0][[0, -1]]
+                item_array = np.array(image); item_rgba = np.zeros((*item_array.shape[:2], 4), dtype=np.uint8)
+                item_rgba[:,:,:3] = item_array; item_rgba[:,:,3] = mask * 255
+                cropped_pil = Image.fromarray(item_rgba[rmin:rmax+1, cmin:cmax+1, :], 'RGBA')
+                buffer = io.BytesIO(); cropped_pil.save(buffer, format="PNG"); item_image_bytes = buffer.getvalue()
+                if debug:
+                    cropped_pil.save(os.path.join(debug_dir, f"item_{i}_{food_obj['label']}_cropped.png"))
+                # c. Classify the food type from the cropped item.
+                food_name = classify_food_image(item_image_bytes)
+                # d. Compute volume and weight.
+                weight, confidence, error_range = weight_service.calculate_volume_and_weight(
+                    mask, depth_map, food_name, reference_object
+                )
+                # e. Look up nutrition data; fall back to zeros when none is found.
+                nutrition_info = fetch_nutrition_data(food_name)
+                if nutrition_info is None:
+                    nutrition_info = {"calories": 0, "protein": 0, "carbs": 0, "fat": 0, "fiber": 0}
+                # f. Scale the nutrients by the estimated weight (weight / 100).
+                weight_ratio = weight / 100
+                adjusted_nutrition = {k: v * weight_ratio for k, v in nutrition_info.items()}
+                # g. Accumulate the totals.
+                for key in total_nutrition: total_nutrition[key] += adjusted_nutrition.get(key, 0)
+                # h. Record this item's result.
+                detected_foods.append({
+                    "food_name": food_name,
+                    "estimated_weight": round(weight, 1),
+                    "nutrition": {k: round(v, 1) for k, v in adjusted_nutrition.items()}
+                })
+            except Exception as item_e:
+                # One bad item must not abort the whole analysis.
+                logger.error(f"處理物件 '{food_obj['label']}' 時失敗: {str(item_e)}")
+                continue
+        # 5. Build the human-readable note.
+        note = f"已使用 YOLO+SAM 模型成功分析 {len(detected_foods)} 項食物。"
         if reference_object:
+            note += f" 檢測到參考物：{reference_object['label']}，準確度較高。"
         else:
+            note += " 未檢測到參考物，重量為估算值，結果僅供參考。"
+        result = {
+            "detected_foods": detected_foods,
+            "total_estimated_weight": round(sum(item['estimated_weight'] for item in detected_foods), 1),
+            "total_nutrition": {k: round(v, 1) for k, v in total_nutrition.items()},
+            "reference_object": reference_object["label"] if reference_object else None,
             "note": note
         }
+        if debug:
+            # Save the final segmentation overlay.
+            overlay_img = image.copy()
+            overlay_array = np.array(overlay_img)
+            # Segment all food boxes again, only to draw them.
+            all_food_boxes = [obj['bbox'] for obj in food_objects]
+            all_masks = weight_service.segment_food(image, input_boxes=all_food_boxes)
+            for mask in all_masks:
+                color = np.random.randint(0, 255, size=3, dtype=np.uint8)
+                overlay_array[mask] = (overlay_array[mask] * 0.5 + color * 0.5).astype(np.uint8)
+            Image.fromarray(overlay_array).save(os.path.join(debug_dir, "02_final_segmentation.jpg"))
+            result["debug_output_path"] = debug_dir
+        return result
     except Exception as e:
+        logger.error(f"多食物重量估算主流程失敗: {str(e)}")
+        # Return the standard structure, carrying the error message in "note".
+        result = {
+            "detected_foods": [],
+            "total_estimated_weight": 0,
+            "total_nutrition": {},
             "reference_object": None,
+            "note": f"分析失敗: {str(e)}"
+        }
+        if debug and debug_dir:
+            result["debug_output_path"] = debug_dir
+        return result