Update src/ai_processor.py

src/ai_processor.py  CHANGED  (+96 -123)
@@ -1,6 +1,10 @@
 # smartheal_ai_processor.py
-#
-#
+# Preserves ALL original class/function names.
+# Changes:
+# - Adds segment_wound(image) with your logic (+ KMeans fallback)
+# - perform_visual_analysis() now calls segment_wound() for mask
+# - Safe overlay (no mask kwarg in addWeighted)
+# - Conditional @spaces.GPU to avoid cudaGetDeviceCount crash
 
 import os
 import time
@@ -8,12 +12,12 @@ import logging
 from datetime import datetime
 from typing import Optional, Dict, List, Tuple
 
-#
+# Quiet HF tokenizers fork warning
 os.environ.setdefault("TOKENIZERS_PARALLELISM", "false")
 
 import cv2
 import numpy as np
-from PIL import Image
+from PIL import Image
 from PIL.ExifTags import TAGS
 
 logging.basicConfig(level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s")
@@ -26,8 +30,8 @@ YOLO_MODEL_PATH = "src/best.pt"
 SEG_MODEL_PATH = "src/segmentation_model.h5"  # optional
 GUIDELINE_PDFS = ["src/eHealth in Wound Care.pdf", "src/IWGDF Guideline.pdf", "src/evaluation.pdf"]
 DATASET_ID = "SmartHeal/wound-image-uploads"
-DEFAULT_PX_PER_CM = 38.0
-PX_PER_CM_MIN, PX_PER_CM_MAX = 5.0, 1200.0
+DEFAULT_PX_PER_CM = 38.0
+PX_PER_CM_MIN, PX_PER_CM_MAX = 5.0, 1200.0
 
 models_cache: Dict[str, object] = {}
 knowledge_base_cache: Dict[str, object] = {}
@@ -39,7 +43,7 @@ def _import_ultralytics():
 
 def _import_tf_loader():
     import tensorflow as tf
-    tf.config.set_visible_devices([], "GPU")  # force
+    tf.config.set_visible_devices([], "GPU")  # force TF CPU
     from tensorflow.keras.models import load_model
     return load_model
 
@@ -63,8 +67,7 @@ def _import_hf_hub():
     from huggingface_hub import HfApi, HfFolder
     return HfApi, HfFolder
 
-# ---------- Conditional Spaces GPU
-# Avoid scheduling a GPU worker when CUDA is not available (prevents cudaGetDeviceCount crash)
+# ---------- Conditional Spaces GPU wrapper ----------
 def _cuda_available() -> bool:
     try:
         import torch
@@ -81,7 +84,6 @@ def _generate_medgemma_report_core(
 ) -> str:
     try:
         from transformers import pipeline
-        # Use CPU by default; if CUDA truly available, pipeline can still map automatically
         pipe = pipeline(
             "image-text-to-text",
             model="google/medgemma-4b-it",
@@ -123,8 +125,6 @@ def _generate_medgemma_report_core(
         logging.error(f"❌ MedGemma generation error: {e}")
         return "⚠️ GPU/LLM worker unavailable"
 
-# Preserve the SAME public function name.
-# Only decorate with @spaces.GPU if CUDA is truly available.
 try:
     import spaces
     if _cuda_available():
@@ -145,7 +145,6 @@ try:
         image_pil: Image.Image,
         max_new_tokens: Optional[int] = None,
     ) -> str:
-        # no decorator -> no GPU worker init -> no cudaGetDeviceCount crash
         return _generate_medgemma_report_core(patient_info, visual_results, guideline_context, image_pil, max_new_tokens)
 except Exception:
     def generate_medgemma_report(
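Note: the two hunks above keep the conditional-decoration logic but drop its explanatory comments. The idea, as a minimal sketch (illustrative names, not the file's exact code; it assumes the Hugging Face `spaces` package, whose `spaces.GPU` decorator schedules a ZeroGPU worker for the call):

    def _core(prompt: str) -> str:
        # stand-in for _generate_medgemma_report_core(...)
        return f"report for {prompt}"

    def _cuda_available() -> bool:
        try:
            import torch
            return bool(torch.cuda.is_available())
        except Exception:
            return False

    try:
        import spaces
        if _cuda_available():
            # CUDA really present: let Spaces schedule a GPU worker
            generate_report = spaces.GPU(_core)
        else:
            # CPU-only Space: plain alias, so no GPU worker init
            # (and therefore no cudaGetDeviceCount crash at startup)
            generate_report = _core
    except Exception:
        generate_report = _core  # `spaces` not installed, e.g. running locally

Either way the public name stays the same, so callers never know whether they got the decorated or the plain function.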
@@ -289,7 +288,6 @@ def estimate_px_per_cm_from_exif(pil_img: Image.Image, default_px_per_cm: float
     f35 = _to_float(exif.get("FocalLengthIn35mmFilm") or exif.get("FocalLengthIn35mm"))
     subj_dist_m = _to_float(exif.get("SubjectDistance"))
     sensor_w_mm = _estimate_sensor_width_mm(f_mm, f35)
-
     meta.update({"f_mm": f_mm, "f35": f35, "sensor_w_mm": sensor_w_mm, "distance_m": subj_dist_m})
 
     if f_mm and sensor_w_mm and subj_dist_m and subj_dist_m > 0:
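Note: the calibration here is a pinhole-camera estimate. The sensor width comes from the 35mm-equivalent focal length (a full-frame sensor is 36 mm wide), the scene width at the subject plane is `sensor_w_mm / f_mm * distance`, and px/cm follows from the image width. A sketch of that arithmetic only (the module's PX_PER_CM_MIN/PX_PER_CM_MAX bounds presumably clip the result; they and the `meta` bookkeeping are omitted here):

    def px_per_cm_estimate(img_w_px: int, f_mm: float, f35: float, distance_m: float) -> float:
        sensor_w_mm = 36.0 * f_mm / f35                           # from the 35mm crop factor
        scene_w_cm = (sensor_w_mm / f_mm) * distance_m * 100.0    # width seen at the subject plane
        return img_w_px / scene_w_cm

    # e.g. a 4000 px wide photo, 5.6 mm lens reported as 26 mm equivalent, shot from 0.30 m:
    # sensor ≈ 7.75 mm, scene ≈ 41.5 cm wide, so ≈ 96 px/cm
    print(round(px_per_cm_estimate(4000, 5.6, 26.0, 0.30), 1))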
@@ -304,64 +302,65 @@ def estimate_px_per_cm_from_exif(pil_img: Image.Image, default_px_per_cm: float
     except Exception:
         return float(default_px_per_cm), meta
 
-# ----------
-def
-
-
-
-
-
-        shp = seg_model.inputs[0].shape
-        return int(shp[1]), int(shp[2])
-    except Exception:
-        pass
-    raise ValueError(f"Cannot infer (H,W) from segmentation model input shape: {shp}")
-
-def _to_prob(mask_pred: np.ndarray) -> np.ndarray:
-    m = np.array(mask_pred)
-    # squeeze batch/channel dims
-    while m.ndim > 2:
-        if m.shape[0] == 1:
-            m = np.squeeze(m, axis=0)
-        if m.ndim > 2 and m.shape[-1] == 1:
-            m = np.squeeze(m, axis=-1)
-        if m.ndim == 3 and m.shape[-1] > 1:
-            # pick the most active channel
-            ch = np.argmax(m.reshape(-1, m.shape[-1]).mean(0))
-            m = m[..., ch]
-        if m.ndim <= 2:
-            break
-    m = m.astype("float32")
-    # if it looks like logits -> sigmoid
-    if m.max() > 1.5 or m.min() < -0.5:
-        m = 1.0 / (1.0 + np.exp(-m))
-    return np.clip(m, 0.0, 1.0)
-
-def _adaptive_threshold(prob: np.ndarray, hard: float = 0.5) -> np.ndarray:
-    if (prob >= hard).sum() > 0:
-        return (prob >= hard).astype("uint8")
-    # try Otsu
-    m8 = (np.clip(prob, 0, 1) * 255).astype("uint8")
-    try:
-        # we only need the Otsu threshold value
-        thr, _ = cv2.threshold(m8, 0, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU)
-        return (m8 >= thr).astype("uint8")
-    except Exception:
-        p = float(np.percentile(prob, 99.0))
-        return (prob >= max(0.2, min(0.9, p))).astype("uint8")
 
-
-
+# ---------- Your requested segmentation logic ----------
+def segment_wound(image: np.ndarray) -> np.ndarray:
+    """
+    Segments wound from a preprocessed ROI image, with a fallback to KMeans if the model fails.
+    Returns a mask in 0..255 (uint8), same HxW as input image.
+    """
+    segmentation_model = models_cache.get("seg", None)
+
+    if segmentation_model is not None:
+        try:
+            input_size = getattr(segmentation_model, "input_shape", None)
+            if input_size is None or len(input_size) < 3:
+                raise ValueError(f"Bad seg input_shape: {input_size}")
+            H, W = int(input_size[1]), int(input_size[2])  # (None, H, W, C)
+
+            resized = cv2.resize(image, (W, H))  # cv2 takes (W, H)
+            norm = np.expand_dims(resized / 255.0, axis=0)  # (1, H, W, 3)
+            prediction = segmentation_model.predict(norm, verbose=0)
+
+            # Handle models with multiple outputs
+            if isinstance(prediction, list):
+                prediction = prediction[0]
+            # squeeze batch dim if present
+            prediction = prediction[0] if prediction.ndim >= 3 else prediction
+
+            # prediction can be (H, W, 1) or (H, W)
+            pred2d = prediction.squeeze()
+            mask_prob = cv2.resize(pred2d, (image.shape[1], image.shape[0]))  # back to ROI size
+            mask = (mask_prob >= 0.5).astype(np.uint8) * 255
+            if mask.max() == 0:
+                logging.info("Seg model returned empty mask at 0.5 — keeping as-is (KMeans fallback will handle if needed).")
+            return mask.astype(np.uint8)
+        except Exception as e:
+            logging.warning(f"⚠️ Segmentation model prediction failed: {e}. Falling back to KMeans.")
+
+    # --- Fallback: color clustering (KMeans, k=2) ---
+    Z = image.reshape((-1, 3)).astype(np.float32)
+    criteria = (cv2.TERM_CRITERIA_EPS + cv2.TERM_CRITERIA_MAX_ITER, 10, 1.0)
+    _K = 2
+    _, labels, centers = cv2.kmeans(Z, _K, None, criteria, 5, cv2.KMEANS_PP_CENTERS)
+    centers = centers.astype(np.uint8).reshape(1, _K, 3)
+    centers_lab = cv2.cvtColor(centers, cv2.COLOR_BGR2LAB)[0]
+    wound_idx = int(np.argmax(centers_lab[:, 1]))  # reddest cluster (a* channel)
+    mask = (labels.reshape(image.shape[:2]) == wound_idx).astype(np.uint8) * 255
+    return mask.astype(np.uint8)
+
+# ---------- Measurement + overlay helpers ----------
+def largest_component_mask(binary01: np.ndarray, min_area_px: int = 50) -> np.ndarray:
+    num, labels, stats, _ = cv2.connectedComponentsWithStats(binary01.astype(np.uint8), connectivity=8)
     if num <= 1:
-        return
+        return binary01.astype(np.uint8)
     areas = stats[1:, cv2.CC_STAT_AREA]
     if areas.size == 0 or areas.max() < min_area_px:
-        return
+        return binary01.astype(np.uint8)
     largest_idx = 1 + int(np.argmax(areas))
     return (labels == largest_idx).astype(np.uint8)
 
-def measure_min_area_rect(mask: np.ndarray, px_per_cm: float) -> Tuple[float, float, Tuple]:
-    contours, _ = cv2.findContours(
+def measure_min_area_rect(mask01: np.ndarray, px_per_cm: float) -> Tuple[float, float, Tuple]:
+    contours, _ = cv2.findContours(mask01.astype(np.uint8), cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
     if not contours:
         return 0.0, 0.0, (None, None)
     cnt = max(contours, key=cv2.contourArea)
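Note on the new fallback: in OpenCV's LAB space the a* channel (index 1) grows toward red, so `np.argmax(centers_lab[:, 1])` picks the redder of the two KMeans centers, a reasonable wound-vs-skin heuristic when no model is loaded. Hypothetical usage of the new helper, assuming the module context above (cv2, logging, and segment_wound in scope; the file name is made up):

    roi = cv2.imread("wound_roi.png")   # hypothetical BGR wound crop
    mask = segment_wound(roi)           # uint8, 0..255, same HxW as roi
    coverage = (mask > 0).mean()
    logging.info(f"wound covers {coverage:.1%} of the ROI")

Also note the changed contract of `largest_component_mask`: instead of returning None on an empty or too-small mask (which the old `return` did), it now echoes the input mask back, so downstream code always receives an array.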
@@ -373,8 +372,8 @@ def measure_min_area_rect(mask: np.ndarray, px_per_cm: float) -> Tuple[float, float, Tuple]:
     box = cv2.boxPoints(rect).astype(int)
     return length_cm, breadth_cm, (box, rect[0])
 
-def count_area_cm2(
-    px_count = float(
+def count_area_cm2(mask01: np.ndarray, px_per_cm: float) -> float:
+    px_count = float(mask01.astype(bool).sum())
     return round(px_count / (max(px_per_cm, 1e-6) ** 2), 2)
 
 def draw_measurement_overlay(
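Note: lengths divide by `px_per_cm`, areas by its square. At the default calibration of 38 px/cm, one cm² is 38² = 1444 mask pixels, e.g.:

    px_per_cm = 38.0                              # DEFAULT_PX_PER_CM
    px_count = 21_660                             # hypothetical mask pixel count
    print(round(px_count / px_per_cm ** 2, 2))    # 15.0 (cm²)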
@@ -386,13 +385,11 @@ def draw_measurement_overlay(
     thickness: int = 2
 ) -> np.ndarray:
     overlay = base_bgr.copy()
-
-
-    blended = cv2.addWeighted(overlay, 1.0, colored, 0.3, 0)
+    red = np.zeros_like(overlay); red[:] = (0, 0, 255)
+    blended = cv2.addWeighted(overlay, 1.0, red, 0.3, 0)
     m3 = np.dstack([mask01 * 255] * 3).astype("uint8")
-
-
-    overlay = cv2.add(bg, blended_masked)
+    overlay = cv2.add(cv2.bitwise_and(overlay, cv2.bitwise_not(m3)),
+                      cv2.bitwise_and(blended, m3))
 
     if rect_box is not None:
         cv2.polylines(overlay, [rect_box], True, (255, 255, 255), thickness)
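Note: `cv2.addWeighted` has no mask argument, hence the two-step composite the new lines use: tint the whole frame, then keep tinted pixels only inside the mask and original pixels outside it. The pattern in isolation, with made-up inputs:

    import cv2
    import numpy as np

    img = np.full((100, 100, 3), 180, np.uint8)             # stand-in image
    mask01 = np.zeros((100, 100), np.uint8)
    mask01[30:70, 30:70] = 1                                 # stand-in wound mask

    red = np.zeros_like(img); red[:] = (0, 0, 255)
    blended = cv2.addWeighted(img, 1.0, red, 0.3, 0)         # saturating red tint everywhere
    m3 = np.dstack([mask01 * 255] * 3).astype("uint8")
    out = cv2.add(cv2.bitwise_and(img, cv2.bitwise_not(m3)), # outside mask: original pixels
                  cv2.bitwise_and(blended, m3))              # inside mask: tinted pixels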
@@ -410,15 +407,14 @@ def draw_measurement_overlay(
     cv2.arrowedLine(img, p1, p2, (255, 255, 255), thickness, tipLength=0.05)
     cv2.arrowedLine(img, p2, p1, (255, 255, 255), thickness, tipLength=0.05)
 
-    draw_arrow(overlay, mids[long_pair[0]], mids[long_pair[1]])
-    draw_arrow(overlay, mids[short_pair[0]], mids[short_pair[1]])
-
     def put_label(text, org):
         cv2.putText(overlay, text, (org[0] + 4, org[1] - 4),
                     cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 0), 4, cv2.LINE_AA)
         cv2.putText(overlay, text, (org[0] + 4, org[1] - 4),
                     cv2.FONT_HERSHEY_SIMPLEX, 0.7, (255, 255, 255), 2, cv2.LINE_AA)
 
+    draw_arrow(overlay, mids[long_pair[0]], mids[long_pair[1]])
+    draw_arrow(overlay, mids[short_pair[0]], mids[short_pair[1]])
     put_label(f"{length_cm:.2f} cm", mids[long_pair[0]])
     put_label(f"{breadth_cm:.2f} cm", mids[short_pair[0]])
     return overlay
@@ -439,24 +435,20 @@ class AIProcessor:
 
     def perform_visual_analysis(self, image_pil: Image.Image) -> Dict:
         """
-
-
+        YOLO detect → crop ROI → segment_wound(ROI) → largest component →
+        minAreaRect measurement (cm) using EXIF px/cm → save outputs.
         """
         try:
-            # --- Auto calibration from EXIF ---
             px_per_cm, exif_meta = estimate_px_per_cm_from_exif(image_pil, DEFAULT_PX_PER_CM)
-
-            # Convert PIL to OpenCV BGR
             image_cv = cv2.cvtColor(np.array(image_pil.convert("RGB")), cv2.COLOR_RGB2BGR)
 
-            # --- Detection
+            # --- Detection ---
             det_model = self.models_cache.get("det")
             if det_model is None:
                 raise RuntimeError("YOLO model not loaded")
-
             results = det_model.predict(image_cv, verbose=False, device="cpu")
             if not results or not getattr(results[0], "boxes", None) or len(results[0].boxes) == 0:
-                import gradio as gr
+                import gradio as gr
                 raise gr.Error("No wound could be detected.")
 
             box = results[0].boxes[0].xyxy[0].cpu().numpy().astype(int)
@@ -468,36 +460,21 @@ class AIProcessor:
                 import gradio as gr
                 raise gr.Error("Detected ROI is empty.")
 
-            # --- Segmentation (
-
-
-
-
-
-
-                    pred = seg_model.predict(np.expand_dims(resized / 255.0, 0), verbose=0)
-                    prob = _to_prob(pred)  # (H,W) in [0,1]
-                    binmask = _adaptive_threshold(prob, hard=0.5)
-                    # gentle cleanup + largest component
-                    binmask = cv2.morphologyEx(binmask, cv2.MORPH_OPEN, np.ones((3,3), np.uint8), iterations=1)
-                    binmask = cv2.morphologyEx(binmask, cv2.MORPH_CLOSE, np.ones((3,3), np.uint8), iterations=1)
-                    binmask = largest_component_mask(binmask, min_area_px=30)
-                    # back to ROI size {0,1}
-                    mask_roi_01 = cv2.resize(binmask, (roi.shape[1], roi.shape[0]), interpolation=cv2.INTER_NEAREST).astype(np.uint8)
-                    logging.info(f"seg prob stats: min={prob.min():.4f}, max={prob.max():.4f}, mean={prob.mean():.4f}; on={(mask_roi_01==1).sum()}")
-                except Exception as e:
-                    logging.warning(f"Segmentation failed: {e}")
-                    mask_roi_01 = None
-            else:
-                logging.info("Skipping segmentation (no model).")
+            # --- Segmentation (your logic + fallback) ---
+            mask_u8_255 = segment_wound(roi)  # 0..255
+            # Clean up & keep largest component (in 0/1)
+            mask01 = (mask_u8_255 > 127).astype(np.uint8)
+            mask01 = cv2.morphologyEx(mask01, cv2.MORPH_OPEN, np.ones((3,3), np.uint8), iterations=1)
+            mask01 = cv2.morphologyEx(mask01, cv2.MORPH_CLOSE, np.ones((3,3), np.uint8), iterations=1)
+            mask01 = largest_component_mask(mask01, min_area_px=30)
 
             # --- Measurement ---
-            if
-                length_cm, breadth_cm, (box_pts, _) = measure_min_area_rect(
-                surface_area_cm2 = count_area_cm2(
-                anno_roi = draw_measurement_overlay(roi,
+            if mask01.any():
+                length_cm, breadth_cm, (box_pts, _) = measure_min_area_rect(mask01, px_per_cm)
+                surface_area_cm2 = count_area_cm2(mask01, px_per_cm)
+                anno_roi = draw_measurement_overlay(roi, mask01, box_pts, length_cm, breadth_cm)
             else:
-                # fallback to detection
+                # fallback to detection box
                 h_px = max(0, y2 - y1); w_px = max(0, x2 - x1)
                 length_cm = round(h_px / px_per_cm, 2)
                 breadth_cm = round(w_px / px_per_cm, 2)
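Note: the open/close pair retained here is standard mask hygiene. Opening (erode then dilate) deletes isolated speckle, closing (dilate then erode) fills pin-holes, and `largest_component_mask` then drops any leftover satellite blobs. A quick self-contained check of that behavior on a synthetic mask:

    import cv2
    import numpy as np

    m = np.zeros((60, 60), np.uint8)
    m[20:40, 20:40] = 1
    m[5, 5] = 1                   # speckle: opening removes it
    m[30, 30] = 0                 # pin-hole: closing fills it

    k = np.ones((3, 3), np.uint8)
    m = cv2.morphologyEx(m, cv2.MORPH_OPEN, k, iterations=1)
    m = cv2.morphologyEx(m, cv2.MORPH_CLOSE, k, iterations=1)
    assert m[5, 5] == 0 and m[30, 30] == 1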
@@ -518,18 +495,14 @@ class AIProcessor:
 
             segmentation_path = None
             annotated_seg_path = None
-            if
-                # safe masked blend (no mask kwarg to addWeighted)
+            if mask01.any():
                 seg_full = image_cv.copy()
-
-                red = np.zeros_like(
-                blended = cv2.addWeighted(
-
-
-
-                roi_bg = cv2.bitwise_and(roi_overlay, cv2.bitwise_not(mask3))
-                roi_overlay = cv2.add(roi_bg, blended_masked)
-
+                # safe masked blend (no mask kwarg)
+                red = np.zeros_like(roi); red[:] = (0, 0, 255)
+                blended = cv2.addWeighted(roi, 1.0, red, 0.3, 0)
+                m3 = np.dstack([mask01 * 255] * 3).astype("uint8")
+                roi_overlay = cv2.add(cv2.bitwise_and(roi, cv2.bitwise_not(m3)),
+                                      cv2.bitwise_and(blended, m3))
                 seg_full[y1:y2, x1:x2] = roi_overlay
                 segmentation_path = os.path.join(out_dir, f"segmentation_{ts}.png")
                 cv2.imwrite(segmentation_path, seg_full)
@@ -568,7 +541,7 @@ class AIProcessor:
             logging.error(f"Visual analysis failed: {e}", exc_info=True)
             raise
 
-    # ---------- Knowledge base
+    # ---------- Knowledge base + reporting (unchanged names) ----------
     def query_guidelines(self, query: str) -> str:
         try:
             vs = self.knowledge_base_cache.get("vector_store")