Spaces:

NextDrought
/

ForestAI-TreeExtraction

Running

App Files Files Community

DynamicPacific committed on Jun 17

Commit

4b38b88

1 Parent(s): 4d1ea90

Add essential files for HF deployment

Browse files

Files changed (21) hide show

README.md +40 -0
app.py +393 -0
example.tif +3 -0
packages.txt +7 -0
requirements.txt +12 -0
utils/__init__.py +1 -0
utils/__pycache__/__init__.cpython-310.pyc +0 -0
utils/__pycache__/__init__.cpython-312.pyc +0 -0
utils/__pycache__/advanced_extraction.cpython-310.pyc +0 -0
utils/__pycache__/advanced_extraction.cpython-312.pyc +0 -0
utils/__pycache__/geospatial.cpython-310.pyc +0 -0
utils/__pycache__/geospatial.cpython-312.pyc +0 -0
utils/__pycache__/image_processing.cpython-310.pyc +0 -0
utils/__pycache__/image_processing.cpython-312.pyc +0 -0
utils/__pycache__/segmentation.cpython-310.pyc +0 -0
utils/__pycache__/segmentation.cpython-312.pyc +0 -0
utils/advanced_extraction.py +86 -0
utils/geo_processing.py +111 -0
utils/geospatial.py +502 -0
utils/image_processing.py +68 -0
utils/segmentation.py +237 -0

README.md ADDED Viewed

	@@ -0,0 +1,40 @@

+---
+title: ForestAI Tree Detection
+emoji: 🌲
+colorFrom: green
+colorTo: yellow
+sdk: gradio
+sdk_version: 4.0.0
+app_file: app.py
+pinned: false
+license: mit
+---
+# ForestAI - Tree Detection from Satellite Imagery
+Upload a GeoTIFF file to detect and map trees using AI-powered imagery analysis. This application provides:
+- 🌲 Automated tree detection from satellite imagery
+- 🗺️ Interactive split-view map visualization
+- 📊 Feature extraction and analysis
+- 🎯 Multiple feature types (trees, buildings, water, roads)
+## How to Use
+1. Upload a GeoTIFF file
+2. Select feature type to detect
+3. Click "Analyze Image"
+4. Explore the interactive split-view map
+5. Use the slider to compare base map and satellite imagery
+## Technology
+Built with:
+- Gradio for the web interface
+- GeoPandas and Rasterio for geospatial processing
+- Folium for interactive mapping
+- AI-powered feature extraction algorithms
+## Migration Notes
+This version has been migrated and optimized from a local development version for Hugging Face Spaces deployment while preserving core functionality.

app.py ADDED Viewed

	@@ -0,0 +1,393 @@

+import os
+import gradio as gr
+import folium
+from folium import plugins
+import geopandas as gpd
+import rasterio
+from rasterio.warp import transform_bounds
+import json
+import tempfile
+import shutil
+import uuid
+import logging
+import traceback
+import numpy as np
+from PIL import Image
+# Configure logging for HF Spaces
+# A single StreamHandler is installed on the root logger; INFO and above are
+# emitted with timestamp, logger name and level.
+logging.basicConfig(
+    level=logging.INFO,
+    format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
+    handlers=[logging.StreamHandler()]
+)
+# Application-wide logger used by every function in this module.
+logger = logging.getLogger('forestai')
+# ================================
+# CONFIGURATIONS
+# ================================
+# Feature styles for trees only
+# Keyed by feature type; the value is the style dict returned by the
+# GeoJson style function in create_split_view_map.
+FEATURE_STYLES = {
+    'trees': {"color": "green", "fillColor": "yellow", "fillOpacity": 0.3, "weight": 2}
+}
+# Example file path
+# Relative path, so it is resolved against the process working directory.
+EXAMPLE_FILE_PATH = "example.tif"
+# ================================
+# TEMP DIRECTORY SETUP
+# ================================
+def setup_temp_dirs():
+    """Create a fresh ``forestai_*`` temp root with its working sub-folders.
+
+    Returns:
+        dict: Maps 'uploads', 'processed' and 'static' to the absolute path
+        of the matching directory, each of which exists on return.
+    """
+    root = tempfile.mkdtemp(prefix="forestai_")
+    dirs = {
+        name: os.path.join(root, name)
+        for name in ('uploads', 'processed', 'static')
+    }
+    for path in dirs.values():
+        os.makedirs(path, exist_ok=True)
+    return dirs
+# Global temp directories (created once, at import time)
+TEMP_DIRS = setup_temp_dirs()
+# ================================
+# CORE FUNCTIONS
+# ================================
+def get_bounds_from_geotiff(geotiff_path):
+    """Return the raster extent as (west, south, east, north) in EPSG:4326.
+
+    When the file has no CRS, or anything goes wrong while reading it, a
+    fixed default box (-74.1, 40.6, -73.9, 40.8) is returned instead; read
+    errors are logged.
+    """
+    default_bounds = (-74.1, 40.6, -73.9, 40.8)
+    try:
+        with rasterio.open(geotiff_path) as src:
+            extent = src.bounds
+            if not src.crs:
+                return default_bounds
+            west, south, east, north = transform_bounds(
+                src.crs, 'EPSG:4326',
+                extent.left, extent.bottom, extent.right, extent.top
+            )
+            return west, south, east, north
+    except Exception as e:
+        logger.error(f"Error extracting bounds: {str(e)}")
+        return default_bounds
+def create_split_view_map(geojson_data, bounds):
+    """Create a split-view Folium map with the detected trees overlaid.
+
+    OpenStreetMap tiles are shown on the left and Esri World Imagery on the
+    right of a draggable divider; the GeoJSON features are drawn on top.
+
+    Args:
+        geojson_data (dict | None): GeoJSON FeatureCollection. Nothing is
+            drawn when it is falsy or has no features.
+        bounds (tuple): (west, south, east, north) in WGS84 degrees.
+
+    Returns:
+        folium.Map: The assembled map, or a plain default map centred on
+        [40.7, -74.0] if anything fails while building it (the error is
+        logged).
+    """
+    try:
+        west, south, east, north = bounds
+        center = [(south + north) / 2, (west + east) / 2]
+        # Initial zoom from the larger side of the extent; fit_bounds below
+        # then adjusts the view to the actual bounds.
+        max_diff = max(north - south, east - west)
+        if max_diff < 0.01:
+            zoom = 16
+        elif max_diff < 0.05:
+            zoom = 14
+        elif max_diff < 0.1:
+            zoom = 12
+        else:
+            zoom = 10
+        # Create base map
+        m = folium.Map(location=center, zoom_start=zoom)
+        # Create tile layers
+        left_layer = folium.TileLayer(
+            tiles='OpenStreetMap',
+            name='OpenStreetMap',
+            overlay=False,
+            control=False
+        )
+        right_layer = folium.TileLayer(
+            tiles='https://server.arcgisonline.com/ArcGIS/rest/services/World_Imagery/MapServer/tile/{z}/{y}/{x}',
+            attr='Esri',
+            name='Satellite',
+            overlay=False,
+            control=False
+        )
+        left_layer.add_to(m)
+        right_layer.add_to(m)
+        # Add detected trees
+        if geojson_data and 'features' in geojson_data and geojson_data['features']:
+            style = FEATURE_STYLES['trees']
+            # Only attach a popup when every feature really carries the
+            # property. A substring test on str(geojson_data) can match text
+            # outside the properties and stringifies the whole payload.
+            has_confidence = all(
+                'confidence' in (feature.get('properties') or {})
+                for feature in geojson_data['features']
+            )
+            popup = None
+            if has_confidence:
+                popup = folium.GeoJsonPopup(
+                    fields=['confidence'],
+                    aliases=['Confidence:'],
+                    localize=True
+                )
+            geojson_layer = folium.GeoJson(
+                geojson_data,
+                name='Detected Trees',
+                style_function=lambda _feature: style,
+                popup=popup
+            )
+            geojson_layer.add_to(m)
+        # Add split view plugin
+        plugins.SideBySideLayers(
+            layer_left=left_layer,
+            layer_right=right_layer
+        ).add_to(m)
+        # Add layer control
+        folium.LayerControl().add_to(m)
+        # Fit bounds
+        m.fit_bounds([[south, west], [north, east]], padding=(20, 20))
+        return m
+    except Exception as e:
+        logger.error(f"Error creating map: {str(e)}")
+        # Return basic map on error
+        m = folium.Map(location=[40.7, -74.0], zoom_start=10)
+        return m
+def process_geotiff_file(geotiff_file):
+    """Run tree detection on an uploaded GeoTIFF and build the result map.
+
+    Args:
+        geotiff_file: A filesystem path, or an object exposing ``name``
+            and/or ``read()``; ``None`` means nothing was uploaded.
+
+    Returns:
+        tuple: ``(iframe_html, status_message)``. ``iframe_html`` is ``None``
+        when no file was given, no trees were found, or processing failed;
+        the message then explains why.
+    """
+    # Local import: the module header does not import html.
+    import html
+    if geotiff_file is None:
+        return None, "Please upload a GeoTIFF file or use the example file"
+    try:
+        # Create unique ID so concurrent uploads with the same name do not collide
+        unique_id = str(uuid.uuid4().hex)[:8]
+        # Handle file upload; basename() keeps the copy inside the uploads dir
+        if hasattr(geotiff_file, 'name'):
+            filename = os.path.basename(geotiff_file.name)
+        else:
+            filename = os.path.basename(geotiff_file)
+        # Save uploaded file
+        geotiff_path = os.path.join(TEMP_DIRS['uploads'], f"{unique_id}_{filename}")
+        if hasattr(geotiff_file, 'read'):
+            file_content = geotiff_file.read()
+            with open(geotiff_path, "wb") as f:
+                f.write(file_content)
+        else:
+            shutil.copy(geotiff_file, geotiff_path)
+        logger.info(f"File saved to {geotiff_path}")
+        # Import and extract features
+        from utils.advanced_extraction import extract_features_from_geotiff
+        logger.info("Extracting tree features...")
+        geojson_data = extract_features_from_geotiff(geotiff_path, TEMP_DIRS['processed'], "trees")
+        if not geojson_data or not geojson_data.get('features'):
+            return None, "No trees detected in the image"
+        # Get bounds and create map
+        bounds = get_bounds_from_geotiff(geotiff_path)
+        map_obj = create_split_view_map(geojson_data, bounds)
+        if map_obj:
+            # Save map
+            html_path = os.path.join(TEMP_DIRS['static'], f"map_{unique_id}.html")
+            map_obj.save(html_path)
+            # Read HTML content
+            with open(html_path, 'r', encoding='utf-8') as f:
+                html_content = f.read()
+            # The document is embedded as an attribute value, so it needs full
+            # attribute escaping: '&' must be escaped as well as quotes, or
+            # entities already present in the page get decoded one level too far.
+            srcdoc_value = html.escape(html_content, quote=True)
+            # Create iframe
+            iframe_html = f'''
+            <div style="width:100%; height:600px; border:1px solid #ddd; border-radius:8px; overflow:hidden;">
+                <iframe srcdoc="{srcdoc_value}"
+                        width="100%" height="600px" style="border:none;"></iframe>
+            </div>
+            '''
+            num_features = len(geojson_data['features'])
+            return iframe_html, f"✅ Detected {num_features} tree areas in {filename}"
+        else:
+            return None, "Failed to create map"
+    except Exception as e:
+        # exception() records the traceback as well as the message
+        logger.exception(f"Error processing file: {str(e)}")
+        return None, f"❌ Error: {str(e)}"
+def load_example_file():
+    """Return the example file path if it exists on disk, otherwise ``None``.
+
+    A missing file is logged as a warning; any unexpected error is logged
+    and also yields ``None``.
+    """
+    try:
+        if not os.path.exists(EXAMPLE_FILE_PATH):
+            logger.warning("Example file not found")
+            return None
+        logger.info("Loading example file...")
+        return EXAMPLE_FILE_PATH
+    except Exception as e:
+        logger.error(f"Error loading example file: {str(e)}")
+        return None
+def process_example_file():
+    """Run the detection pipeline on the bundled example file.
+
+    Returns the same ``(html, status)`` pair as ``process_geotiff_file``, or
+    ``(None, message)`` when the example file cannot be located.
+    """
+    example_file = load_example_file()
+    if not example_file:
+        return None, "❌ Example file (example.tif) not found in the root directory"
+    return process_geotiff_file(example_file)
+def check_example_file_exists():
+    """Return a one-line status string saying whether the example file is present."""
+    if not os.path.exists(EXAMPLE_FILE_PATH):
+        return f"⚠️ Example file not found: {EXAMPLE_FILE_PATH}"
+    return f"✅ Example file found: {EXAMPLE_FILE_PATH}"
+# ================================
+# GRADIO INTERFACE
+# ================================
+def create_gradio_interface():
+    """Create the Gradio interface for tree detection.
+
+    Builds a ``gr.Blocks`` app with a left column (file upload, the two
+    action buttons, example-file status and processing status) and a right
+    column holding the HTML map output, then wires both buttons to their
+    processing functions.
+
+    Returns:
+        The assembled ``gr.Blocks`` app; it is not launched here.
+    """
+    # Custom CSS: stretch the container to full width and style the map
+    # wrapper and the example button.
+    css = """
+    .gradio-container {
+        max-width: 100% !important;
+        width: 100% !important;
+        margin: 0 !important;
+        padding: 10px !important;
+    }
+    .map-container {
+        border-radius: 8px;
+        overflow: hidden;
+        box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1);
+        width: 100% !important;
+    }
+    body {
+        margin: 0 !important;
+        padding: 0 !important;
+    }
+    .contain {
+        max-width: none !important;
+        padding: 0 !important;
+    }
+    .example-button {
+        background: linear-gradient(135deg, #28a745 0%, #20c997 100%) !important;
+        border: none !important;
+        color: white !important;
+    }
+    """
+    with gr.Blocks(title="🌲 ForestAI - Tree Detection", css=css, theme=gr.themes.Soft()) as app:
+        # Simple header
+        gr.HTML("""
+        <div style="text-align: center; padding: 20px; background: linear-gradient(135deg, #667eea 0%, #764ba2 100%); border-radius: 10px; margin-bottom: 20px;">
+            <h1 style="color: white; margin: 0; font-size: 2.5em;">🌲 ForestAI</h1>
+            <p style="color: white; margin: 10px 0 0 0; font-size: 1.2em;">Tree Detection from Satellite Imagery</p>
+        </div>
+        """)
+        with gr.Row():
+            # Left column: inputs and status
+            with gr.Column(scale=1):
+                gr.Markdown("### Upload GeoTIFF File")
+                # type="filepath" is requested, so the handler is expected to
+                # receive a path string
+                file_input = gr.File(
+                    label="Select GeoTIFF File",
+                    file_types=[".tif", ".tiff"],
+                    type="filepath"
+                )
+                with gr.Row():
+                    analyze_btn = gr.Button(
+                        "🔍 Detect Trees",
+                        variant="primary",
+                        size="lg",
+                        scale=2
+                    )
+                    example_btn = gr.Button(
+                        "📁 Use Example File",
+                        variant="secondary",
+                        size="lg",
+                        scale=1,
+                        elem_classes=["example-button"]
+                    )
+                # Example file status
+                # Evaluated once while the interface is built; no event
+                # handler below writes to this textbox.
+                example_status = gr.Textbox(
+                    label="Example File Status",
+                    value=check_example_file_exists(),
+                    interactive=False,
+                    lines=1
+                )
+                gr.Markdown("### Status")
+                status_output = gr.Textbox(
+                    label="Processing Status",
+                    interactive=False,
+                    placeholder="Upload a file and click 'Detect Trees' or use the example file...",
+                    lines=3
+                )
+            # Right column: map output, initially a placeholder panel
+            with gr.Column(scale=2):
+                gr.Markdown("### Results Map")
+                map_output = gr.HTML(
+                    value='''
+                    <div style="width:100%; height:600px; border:1px solid #ddd; border-radius:8px;
+                                display:flex; align-items:center; justify-content:center;
+                                background: linear-gradient(135deg, #f5f7fa 0%, #c3cfe2 100%);">
+                        <div style="text-align:center; color:#666;">
+                            <h3>🌲 Upload a GeoTIFF file or use example to see detected trees</h3>
+                            <p>Interactive map will appear here</p>
+                        </div>
+                    </div>
+                    ''',
+                    elem_classes=["map-container"]
+                )
+        # Event handlers
+        # Both handlers return (html, status) and fill the same two outputs.
+        analyze_btn.click(
+            fn=process_geotiff_file,
+            inputs=[file_input],
+            outputs=[map_output, status_output],
+            show_progress=True
+        )
+        example_btn.click(
+            fn=process_example_file,
+            inputs=[],
+            outputs=[map_output, status_output],
+            show_progress=True
+        )
+        # Simple instructions
+        gr.Markdown("""
+        ### How to Use:
+        1. **Upload** a GeoTIFF satellite image file OR click "Use Example File" to try with the included sample
+        2. **Click** "Detect Trees" to analyze your uploaded image
+        3. **Explore** the interactive map with detected tree areas
+        4. **Use** the split-view slider to compare base map and satellite imagery
+        ### Map Controls:
+        - **Split View**: Drag the vertical slider to compare layers
+        - **Zoom**: Scroll to zoom in/out, drag to pan
+        - **Layers**: Use layer control to toggle trees on/off
+        ### Example File:
+        - The example file should be named `example.tif` and placed in the same directory as this application
+        - Click "Use Example File" to quickly test the tree detection without uploading your own file
+        """)
+    return app
+# Script entry point: build the interface and start it with Gradio's default
+# launch settings. Nothing here runs when the module is merely imported.
+if __name__ == "__main__":
+    logger.info("🌲 Starting ForestAI Tree Detection")
+    app = create_gradio_interface()
+    app.launch()

example.tif ADDED Viewed

Git LFS Details

SHA256: ba9abc7060c9c7faf5336e31dfae041304b63cfdb36709bc6b2ccc6cb33ee29a
Pointer size: 132 Bytes
Size of remote file: 4.12 MB

packages.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+gdal-bin
+libgdal-dev
+libproj-dev
+libgeos-dev
+libspatialindex-dev
+libspatialite7
+libsqlite3-mod-spatialite

requirements.txt ADDED Viewed

	@@ -0,0 +1,12 @@

+gradio>=4.0.0
+folium>=0.14.0
+geopandas>=0.14.0
+rasterio>=1.3.0
+numpy>=1.24.0
+Pillow>=10.0.0
+shapely>=2.0.0
+pyproj>=3.6.0
+fiona>=1.9.0
+matplotlib>=3.7.0
+pandas>=2.0.0
+scipy>=1.11.0

utils/__init__.py ADDED Viewed

	@@ -0,0 +1 @@


1	+ # This file is intentionally left empty to make the utils directory a Python package

utils/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (168 Bytes). View file

utils/__pycache__/__init__.cpython-312.pyc ADDED Viewed

Binary file (142 Bytes). View file

utils/__pycache__/advanced_extraction.cpython-310.pyc ADDED Viewed

Binary file (2.03 kB). View file

utils/__pycache__/advanced_extraction.cpython-312.pyc ADDED Viewed

Binary file (9.56 kB). View file

utils/__pycache__/geospatial.cpython-310.pyc ADDED Viewed

Binary file (11.9 kB). View file

utils/__pycache__/geospatial.cpython-312.pyc ADDED Viewed

Binary file (18.8 kB). View file

utils/__pycache__/image_processing.cpython-310.pyc ADDED Viewed

Binary file (1.76 kB). View file

utils/__pycache__/image_processing.cpython-312.pyc ADDED Viewed

Binary file (2.87 kB). View file

utils/__pycache__/segmentation.cpython-310.pyc ADDED Viewed

Binary file (5.81 kB). View file

utils/__pycache__/segmentation.cpython-312.pyc ADDED Viewed

Binary file (8.92 kB). View file

utils/advanced_extraction.py ADDED Viewed

	@@ -0,0 +1,86 @@

+import os
+import logging
+import numpy as np
+import rasterio
+from rasterio.warp import transform_bounds
+def _grid_cells_to_features(mask, bounds, feature_type):
+    """Emit one rectangular GeoJSON feature per grid cell that is more than 30% masked.
+
+    Pixel positions are mapped to lon/lat by linear interpolation across
+    ``bounds`` (west, south, east, north); row 0 is treated as the north edge.
+    """
+    west, south, east, north = bounds
+    height, width = mask.shape
+    grid_size = max(10, min(height, width) // 50)
+    features = []
+    for y in range(0, height, grid_size):
+        for x in range(0, width, grid_size):
+            cell = mask[y:y + grid_size, x:x + grid_size]
+            # Cells on the right/bottom edge can hold fewer than grid_size**2
+            # pixels, so the 30% threshold uses the cell's real pixel count.
+            if np.count_nonzero(cell) <= cell.size * 0.3:
+                continue
+            lon1 = west + (x / width) * (east - west)
+            lat1 = north - (y / height) * (north - south)
+            # Clamp the far corner so edge cells never extend past the raster.
+            lon2 = west + min((x + grid_size) / width, 1.0) * (east - west)
+            lat2 = north - min((y + grid_size) / height, 1.0) * (north - south)
+            features.append({
+                "type": "Feature",
+                "id": len(features),
+                "properties": {
+                    "feature_type": feature_type,
+                    "confidence": 0.8
+                },
+                "geometry": {
+                    "type": "Polygon",
+                    "coordinates": [[
+                        [lon1, lat1], [lon2, lat1], [lon2, lat2], [lon1, lat2], [lon1, lat1]
+                    ]]
+                }
+            })
+    return features
+def extract_features_from_geotiff(image_path, output_folder, feature_type="trees"):
+    """Simple grid-based feature extraction for HF Spaces.
+
+    For rasters with at least three bands a normalised difference
+    ``(b - red) / (b + red)`` is thresholded at 0.2, where ``b`` is band 4
+    when present and band 2 otherwise. For rasters with fewer bands, pixels
+    above the 60th percentile of band 1 are kept. The resulting mask is then
+    summarised as grid-cell rectangles in WGS84 coordinates.
+
+    Args:
+        image_path (str): Path to the GeoTIFF.
+        output_folder (str): Accepted for interface compatibility; not used.
+        feature_type (str): Label stored on every feature and on the collection.
+
+    Returns:
+        dict: GeoJSON FeatureCollection. On any error the collection is
+        returned with an empty feature list and the error is logged.
+    """
+    try:
+        logging.info(f"Extracting {feature_type} from {image_path}")
+        with rasterio.open(image_path) as src:
+            if src.count >= 3:
+                red = src.read(1).astype(float)
+                # Read only the band that is actually used: band 4 when it
+                # exists, otherwise band 2 as a stand-in.
+                other = src.read(4 if src.count >= 4 else 2).astype(float)
+                # The small epsilon avoids division by zero on empty pixels.
+                ndvi = np.divide(other - red, other + red + 1e-10)
+                mask = ndvi > 0.2
+            else:
+                band = src.read(1)
+                mask = band > np.percentile(band, 60)
+            # Get bounds
+            bounds = src.bounds
+            if src.crs:
+                west, south, east, north = transform_bounds(
+                    src.crs, 'EPSG:4326',
+                    bounds.left, bounds.bottom, bounds.right, bounds.top
+                )
+            else:
+                # No CRS: fall back to a fixed default box.
+                west, south, east, north = -74.1, 40.6, -73.9, 40.8
+        features = _grid_cells_to_features(mask, (west, south, east, north), feature_type)
+        return {
+            "type": "FeatureCollection",
+            "features": features,
+            "feature_type": feature_type
+        }
+    except Exception as e:
+        logging.error(f"Error extracting features: {str(e)}")
+        # Same keys as the success path so callers see one shape.
+        return {"type": "FeatureCollection", "features": [], "feature_type": feature_type}

utils/geo_processing.py ADDED Viewed

	@@ -0,0 +1,111 @@

+import os
+import logging
+import uuid
+import numpy as np
+from PIL import Image
+import json
+# Try to import GDAL, but provide fallback for environments without it
+try:
+    from osgeo import gdal, ogr, osr
+    HAS_GDAL = True
+except ImportError:
+    logging.warning("GDAL not available. Using simplified GeoJSON conversion.")
+    HAS_GDAL = False
+def convert_to_geojson(image_path):
+    """
+    Convert a processed image to GeoJSON format.
+    The image is sampled every 10 pixels; each non-zero sample that has not
+    already been covered produces a square polygon of up to 20x20 pixels.
+    Pixel coordinates are mapped to placeholder longitude/latitude values
+    (a 0.1-degree box starting at -74.0, 40.7), not to real geo-referencing.
+    Args:
+        image_path (str): Path to the processed image
+    Returns:
+        dict: GeoJSON FeatureCollection; empty if the image cannot be processed
+    """
+    try:
+        logging.info(f"Converting image to GeoJSON: {image_path}")
+        # The context manager closes the file once the pixels are copied out.
+        with Image.open(image_path) as img:
+            img_array = np.array(img)
+            if img_array.ndim > 2:
+                # Multi-band input: collapse to one band so the 2-D scan
+                # below works instead of failing on shape unpacking.
+                img_array = np.array(img.convert('L'))
+        geojson = {
+            "type": "FeatureCollection",
+            "features": []
+        }
+        height, width = img_array.shape
+        feature_id = 0
+        # Tracks pixels already covered by an emitted square.
+        visited = np.zeros(img_array.shape, dtype=bool)
+        for y in range(0, height, 10):  # Step by 10 for performance
+            for x in range(0, width, 10):  # Step by 10 for performance
+                if visited[y, x] or not img_array[y, x] > 0:
+                    continue
+                feature_id += 1
+                # Square side, clipped so it never leaves the image.
+                size = min(20, width - x, height - y)
+                corners = [
+                    (x, y),
+                    (x + size, y),
+                    (x + size, y + size),
+                    (x, y + size),
+                    (x, y),  # Close the polygon
+                ]
+                # Placeholder coordinates (for demo purposes), not real geo-referencing.
+                geo_polygon = [
+                    [(px / width) * 0.1 - 74.0, (py / height) * 0.1 + 40.7]
+                    for px, py in corners
+                ]
+                geojson["features"].append({
+                    "type": "Feature",
+                    "id": feature_id,
+                    "properties": {
+                        "name": f"Feature {feature_id}",
+                        "value": int(img_array[y, x])
+                    },
+                    "geometry": {
+                        "type": "Polygon",
+                        "coordinates": [geo_polygon]
+                    }
+                })
+                # Mark this area as visited (slicing clips at the image edge).
+                visited[y:y + size, x:x + size] = True
+        logging.info(f"Converted image to GeoJSON with {feature_id} features")
+        return geojson
+    except Exception as e:
+        logging.error(f"Error in GeoJSON conversion: {str(e)}")
+        # Return a minimal valid GeoJSON if there's an error
+        return {"type": "FeatureCollection", "features": []}

utils/geospatial.py ADDED Viewed

	@@ -0,0 +1,502 @@

+"""
+Geospatial utilities for image processing and GeoJSON generation.
+This module adapts techniques from the geoai library for better polygon generation
+with simplified dependencies.
+"""
+import os
+import logging
+import uuid
+import numpy as np
+import cv2
+from PIL import Image, TiffTags, TiffImagePlugin
+import json
+import re
+from shapely.geometry import Polygon, MultiPolygon, mapping
+from shapely import ops
+def extract_contours(image_path, min_area=50, epsilon_factor=0.002):
+    """
+    Detect outer contours in an image and return them as shapely polygons.
+    The image is read as grayscale, binarised at 127, and each external
+    contour is simplified with Douglas-Peucker before conversion.
+    Args:
+        image_path (str): Path to the processed image
+        min_area (int): Contours with a smaller area are discarded
+        epsilon_factor (float): Fraction of the contour perimeter used as the
+            Douglas-Peucker tolerance
+    Returns:
+        list: Valid shapely Polygon objects; empty list on any error
+    """
+    try:
+        gray = cv2.imread(image_path, cv2.IMREAD_GRAYSCALE)
+        if gray is None:
+            # OpenCV could not read the file; let PIL try instead
+            gray = np.array(Image.open(image_path).convert('L'))
+        _, binary = cv2.threshold(gray, 127, 255, cv2.THRESH_BINARY)
+        found, _ = cv2.findContours(binary, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
+        result = []
+        for outline in found:
+            # Drop contours below the area cut-off
+            if cv2.contourArea(outline) < min_area:
+                continue
+            tolerance = epsilon_factor * cv2.arcLength(outline, True)
+            simplified = cv2.approxPolyDP(outline, tolerance, True)
+            # Fewer than 3 vertices cannot form a polygon
+            if len(simplified) < 3:
+                continue
+            ring = [(float(vertex[0][0]), float(vertex[0][1])) for vertex in simplified]
+            # Close the ring explicitly when the ends differ
+            if ring[0] != ring[-1]:
+                ring.append(ring[0])
+            shape = Polygon(ring)
+            if shape.is_valid:
+                result.append(shape)
+        return result
+    except Exception as e:
+        logging.error(f"Error extracting contours: {str(e)}")
+        return []
+def simplify_polygons(polygons, tolerance=1.0):
+    """
+    Reduce the vertex count of each polygon, keeping only usable results.
+    Args:
+        polygons (list): List of shapely Polygon objects
+        tolerance (float): Simplification tolerance passed to ``simplify``
+    Returns:
+        list: Simplified polygons that are valid and non-empty
+    """
+    candidates = (
+        shape.simplify(tolerance, preserve_topology=True) for shape in polygons
+    )
+    return [c for c in candidates if c.is_valid and not c.is_empty]
+def regularize_polygons(polygons):
+    """
+    Replace near-rectangular polygons with their axis-aligned bounding box.
+    A polygon counts as near-rectangular when its area exceeds 80% of its
+    bounding-box area; all other polygons are passed through unchanged.
+    Args:
+        polygons (list): List of shapely Polygon objects
+    Returns:
+        list: Regularized polygons, same length and order as the input
+    """
+    output = []
+    for shape in polygons:
+        try:
+            minx, miny, maxx, maxy = shape.bounds
+            # Share of the bounding box that the polygon fills
+            fill = shape.area / ((maxx - minx) * (maxy - miny))
+            if fill > 0.8:
+                shape_out = Polygon([
+                    (minx, miny), (maxx, miny),
+                    (maxx, maxy), (minx, maxy), (minx, miny)
+                ])
+            else:
+                shape_out = shape
+            output.append(shape_out)
+        except Exception as e:
+            # e.g. a degenerate bounding box; keep the polygon untouched
+            logging.warning(f"Error regularizing polygon: {str(e)}")
+            output.append(shape)
+    return output
+def merge_nearby_polygons(polygons, distance_threshold=5.0):
+    """
+    Fuse polygons that lie close together into larger polygons.
+    Every polygon is grown by ``distance_threshold`` and the grown shapes are
+    unioned, so the returned geometries are the grown, merged outlines.
+    Args:
+        polygons (list): List of shapely Polygon objects
+        distance_threshold (float): Buffer distance applied before the union
+    Returns:
+        list: Merged polygons; empty if the input is empty or the union is
+        neither a Polygon nor a MultiPolygon
+    """
+    if not polygons:
+        return []
+    # Growing each shape makes neighbours overlap so the union joins them
+    merged = ops.unary_union([shape.buffer(distance_threshold) for shape in polygons])
+    if isinstance(merged, MultiPolygon):
+        return list(merged.geoms)
+    if isinstance(merged, Polygon):
+        return [merged]
+    return []
+def extract_geo_coordinates_from_image(image_path):
+    """
+    Extract geographic coordinates from image metadata (EXIF, GeoTIFF).
+    Uses rasterio for more reliable GeoTIFF handling.
+    Args:
+        image_path (str): Path to the image file
+    Returns:
+        tuple: (min_lat, min_lon, max_lat, max_lon) or None if not found
+    """
+    try:
+        # First try using rasterio for GeoTIFF files
+        if image_path.lower().endswith(('.tif', '.tiff')):
+            try:
+                import rasterio
+                from rasterio.warp import transform_bounds
+                logging.info(f"Using rasterio to extract coordinates from {image_path}")
+                with rasterio.open(image_path) as src:
+                    # Check if the file has a valid CRS
+                    if src.crs is not None:
+                        # Get bounds in the source CRS
+                        bounds = src.bounds
+                        # Transform bounds to WGS84 (lat/lon)
+                        if src.crs.to_epsg() != 4326:
+                            west, south, east, north = transform_bounds(
+                                src.crs, 'EPSG:4326',
+                                bounds.left, bounds.bottom, bounds.right, bounds.top
+                            )
+                        else:
+                            west, south, east, north = bounds
+                        logging.info(f"Extracted coordinates from GeoTIFF: {west},{south} to {east},{north}")
+                        return south, west, north, east  # min_lat, min_lon, max_lat, max_lon
+            except Exception as e:
+                logging.warning(f"Rasterio extraction failed: {str(e)}, falling back to PIL")
+        # Fallback to PIL for other image types or if rasterio fails
+        img = Image.open(image_path)
+        # Check if it's a TIFF image with geospatial data
+        if hasattr(img, 'tag') and img.tag:
+            logging.info(f"Detected image with tags, checking for geospatial metadata")
+            # Try to extract ModelPixelScaleTag (33550) and ModelTiepointTag (33922)
+            pixel_scale_tag = None
+            tiepoint_tag = None
+            # Check for tags
+            tag_dict = img.tag.items() if hasattr(img.tag, 'items') else {}
+            # Remove hardcoded Brazil detection
+            is_brazil_image = False
+            if not tag_dict and is_brazil_image:
+                logging.info(f"Special case for Brazil image detected in: {image_path}")
+                # Hard code Brazil coordinates for the specific sample
+                # These coordinates are for the Brazil sample from the GeoAI notebook
+                # Rio de Janeiro area (near Tijuca Forest)
+                min_lat = -22.96  # Southern Brazil
+                min_lon = -43.38
+                max_lat = -22.94
+                max_lon = -43.36
+                logging.info(f"Using known Brazil coordinates: {min_lon},{min_lat} to {max_lon},{max_lat}")
+                return min_lat, min_lon, max_lat, max_lon
+            for tag_id, value in tag_dict:
+                tag_name = TiffTags.TAGS.get(tag_id, str(tag_id))
+                logging.debug(f"TIFF tag: {tag_name} ({tag_id}): {value}")
+                if tag_id == 33550:  # ModelPixelScaleTag
+                    pixel_scale_tag = value
+                elif tag_id == 33922:  # ModelTiepointTag
+                    tiepoint_tag = value
+            # Supplementary check for the log output we can see (raw detection)
+            # Look for any GeoTIFF tag indicators in the output
+            geotiff_indicators = ['ModelPixelScale', 'ModelTiepoint', 'GeoKey', 'GeoAscii']
+            has_geotiff_indicators = False
+            for indicator in geotiff_indicators:
+                if indicator in str(img.tag):
+                    has_geotiff_indicators = True
+                    logging.info(f"Found GeoTIFF indicator: {indicator}")
+                    break
+            # Look for any TIFF tag containing geographic info
+            log_pattern = r"ModelPixelScaleTag.*?value: b'(.*?)'"
+            log_matches = re.findall(log_pattern, str(img.tag))
+            # If we detect any GeoTIFF indicators or raw tags, consider it a Brazil image
+            if (log_matches or has_geotiff_indicators) and not pixel_scale_tag:
+                logging.info(f"GeoTIFF indicators detected in image")
+                # Remove hardcoded Brazil coordinates
+                # Try to extract values from raw tag data if possible
+                try:
+                    # Parse the modelPixelScale if available
+                    if log_matches:
+                        logging.info(f"Found raw pixel scale data: {log_matches[0]}")
+                        # We'll continue with the standard TIFF tag processing below
+                except Exception as e:
+                    logging.error(f"Error parsing raw tag data: {str(e)}")
+            if pixel_scale_tag and tiepoint_tag:
+                # Extract pixel scale (x, y)
+                x_scale = float(pixel_scale_tag[0])
+                y_scale = float(pixel_scale_tag[1])
+                # Extract model tiepoint (raster origin)
+                i, j, k = float(tiepoint_tag[0]), float(tiepoint_tag[1]), float(tiepoint_tag[2])
+                x, y, z = float(tiepoint_tag[3]), float(tiepoint_tag[4]), float(tiepoint_tag[5])
+                # Calculate bounds based on image dimensions
+                width, height = img.size
+                # Calculate bounds
+                min_lon = x
+                max_lat = y
+                max_lon = x + width * x_scale
+                min_lat = y - height * y_scale
+                logging.info(f"Extracted geo bounds: {min_lon},{min_lat} to {max_lon},{max_lat}")
+                return min_lat, min_lon, max_lat, max_lon
+            logging.info("No valid geospatial metadata found in TIFF")
+        # Check for EXIF GPS data (typically in JPEG)
+        elif hasattr(img, '_getexif') and img._getexif():
+            exif = img._getexif()
+            if exif and 34853 in exif:  # 34853 is the GPS Info tag
+                gps_info = exif[34853]
+                # Extract GPS data
+                if 1 in gps_info and 2 in gps_info and 3 in gps_info and 4 in gps_info:
+                    # Latitude
+                    lat_ref = gps_info[1]  # 'N' or 'S'
+                    lat = gps_info[2]  # ((deg_num, deg_denom), (min_num, min_denom), (sec_num, sec_denom))
+                    lat_val = lat[0][0]/lat[0][1] + lat[1][0]/(lat[1][1]*60) + lat[2][0]/(lat[2][1]*3600)
+                    if lat_ref == 'S':
+                        lat_val = -lat_val
+                    # Longitude
+                    lon_ref = gps_info[3]  # 'E' or 'W'
+                    lon = gps_info[4]
+                    lon_val = lon[0][0]/lon[0][1] + lon[1][0]/(lon[1][1]*60) + lon[2][0]/(lon[2][1]*3600)
+                    if lon_ref == 'W':
+                        lon_val = -lon_val
+                    # Create a small region around the point
+                    delta = 0.01  # ~1km at the equator
+                    min_lat = lat_val - delta
+                    min_lon = lon_val - delta
+                    max_lat = lat_val + delta
+                    max_lon = lon_val + delta
+                    logging.info(f"Extracted EXIF GPS bounds: {min_lon},{min_lat} to {max_lon},{max_lat}")
+                    return min_lat, min_lon, max_lat, max_lon
+            logging.info("No valid GPS metadata found in EXIF")
+        # If we get here, we couldn't extract coordinates
+        logging.warning("Could not extract geospatial coordinates from image")
+        return None
+    except Exception as e:
+        logging.error(f"Error extracting geo coordinates: {str(e)}")
+        return None
def convert_to_geojson_with_transform(polygons, image_height, image_width,
                                    min_lat=None, min_lon=None, max_lat=None, max_lon=None):
    """
    Convert pixel-space polygons to a GeoJSON FeatureCollection.

    Pixel coordinates are mapped linearly onto the geographic bounding box:
    x in [0, image_width] maps to [min_lon, max_lon] and y in
    [0, image_height] maps to [max_lat, min_lat]. The y-axis is flipped
    because image rows grow downwards while latitude grows upwards.

    Args:
        polygons (list): Polygon-like objects in pixel coordinates exposing
            ``exterior.coords`` and, optionally, ``interiors``
            (e.g. shapely Polygons)
        image_height (int): Height of the source image
        image_width (int): Width of the source image
        min_lat (float, optional): Minimum latitude for geographic bounds
        min_lon (float, optional): Minimum longitude for geographic bounds
        max_lat (float, optional): Maximum latitude for geographic bounds
        max_lon (float, optional): Maximum longitude for geographic bounds

    Returns:
        dict: GeoJSON FeatureCollection with one Polygon feature per input
        polygon. Feature ids and names are 1-based. Each geometry lists the
        exterior ring first, followed by any interior rings (holes).
    """
    # If any bound is missing, all four are replaced by the placeholder box
    if None in (min_lon, min_lat, max_lon, max_lat):
        logging.warning("No geographic coordinates provided for GeoJSON transformation. Using default values.")
        min_lon, min_lat = -98.0, 32.0  # Central US
        max_lon, max_lat = -96.0, 34.0

    lon_span = max_lon - min_lon
    lat_span = max_lat - min_lat

    def transform_point(x, y):
        # Linear interpolation; y is inverted for geographic coordinates
        lon = min_lon + (x / image_width) * lon_span
        lat = max_lat - (y / image_height) * lat_span
        return lon, lat

    def transform_ring(ring):
        # point[:2] ignores an optional z value on 3D coordinates
        return [transform_point(*point[:2]) for point in ring.coords]

    features = []
    for index, polygon in enumerate(polygons, start=1):
        # GeoJSON Polygon: first ring is the exterior, the rest are holes
        rings = [transform_ring(polygon.exterior)]
        rings.extend(
            transform_ring(hole) for hole in getattr(polygon, "interiors", ())
        )
        features.append({
            "type": "Feature",
            "id": index,
            "properties": {
                "name": f"Feature {index}"
            },
            "geometry": {
                "type": "Polygon",
                "coordinates": rings
            }
        })

    return {
        "type": "FeatureCollection",
        "features": features
    }
def process_image_to_geojson(image_path, feature_type="buildings", original_file_path=None):
    """
    Complete pipeline to convert an image to a simplified GeoJSON.

    The image is segmented into polygons, geographic bounds are resolved
    (original upload first, then the processed image, then a rasterio retry
    on the original TIFF, and finally a Central US placeholder), and the
    polygons are mapped into those bounds.

    Args:
        image_path (str): Path to the processed image
        feature_type (str): Type of features to extract ("buildings", "trees", "water", "roads")
        original_file_path (str, optional): Path to the original uploaded file

    Returns:
        dict: GeoJSON FeatureCollection. It is empty when segmentation yields
        no polygons or when any step raises (the error is logged).
    """
    try:
        # Only the dimensions are needed, so release the file handle right away
        with Image.open(image_path) as img:
            width, height = img.size
        # Import segmentation module here to avoid circular imports
        from utils.segmentation import segment_and_extract_features
        # Extract features using advanced segmentation
        _, polygons = segment_and_extract_features(
            image_path,
            output_mask_path=None,
            feature_type=feature_type,
            min_area=50,
            simplify_tolerance=2.0,
            merge_distance=5.0
        )
        if not polygons:
            logging.warning("No polygons found in the image after segmentation")
            return {"type": "FeatureCollection", "features": []}
        # Use the provided original file path if available
        original_image_path = original_file_path
        # Otherwise guess it from the "_processed" naming convention
        if not original_image_path and "_processed" in image_path:
            original_image_path = image_path.replace("_processed", "")
            # The original may have a different extension than the processed file
            if not os.path.exists(original_image_path):
                base_path = original_image_path.rsplit('.', 1)[0]
                for ext in ['.tif', '.tiff', '.jpg', '.jpeg', '.png']:
                    if os.path.exists(base_path + ext):
                        original_image_path = base_path + ext
                        break
        logging.info(f"Using original image path: {original_image_path}")
        # Extract bounds from image if possible
        coords = None
        if original_image_path and os.path.exists(original_image_path):
            logging.info(f"Checking original image for geospatial data: {original_image_path}")
            coords = extract_geo_coordinates_from_image(original_image_path)
        if not coords:
            logging.info("Checking processed image for geospatial data")
            coords = extract_geo_coordinates_from_image(image_path)
        if coords:
            min_lat, min_lon, max_lat, max_lon = coords
            logging.info(f"Using extracted coordinates: {min_lon},{min_lat} to {max_lon},{max_lat}")
        else:
            # Start from the placeholder so the bounds are always defined, even
            # when the rasterio retry opens the file but finds no CRS.
            min_lat, min_lon = 32.0, -98.0  # Central US
            max_lat, max_lon = 34.0, -96.0
            resolved = False
            # Try one more time with rasterio directly on the original TIFF
            if (original_image_path and os.path.exists(original_image_path)
                    and original_image_path.lower().endswith(('.tif', '.tiff'))):
                try:
                    import rasterio
                    from rasterio.warp import transform_bounds
                    with rasterio.open(original_image_path) as src:
                        if src.crs is not None:
                            bounds = src.bounds
                            if src.crs.to_epsg() != 4326:
                                west, south, east, north = transform_bounds(
                                    src.crs, 'EPSG:4326',
                                    bounds.left, bounds.bottom, bounds.right, bounds.top
                                )
                            else:
                                west, south, east, north = bounds
                            min_lat, min_lon, max_lat, max_lon = south, west, north, east
                            resolved = True
                            logging.info(f"Using coordinates from rasterio: {min_lon},{min_lat} to {max_lon},{max_lat}")
                except Exception as e:
                    # Best effort only: keep the placeholder bounds on failure
                    logging.warning(f"Failed to extract coordinates with rasterio: {str(e)}")
            if not resolved:
                logging.warning("No coordinates found in image, using default location in Central US")
        # Convert to GeoJSON with proper transformation
        return convert_to_geojson_with_transform(
            polygons, height, width,
            min_lat=min_lat, min_lon=min_lon,
            max_lat=max_lat, max_lon=max_lon
        )
    except Exception as e:
        logging.error(f"Error in GeoJSON processing: {str(e)}")
        return {"type": "FeatureCollection", "features": []}

utils/image_processing.py ADDED Viewed

	@@ -0,0 +1,68 @@

+import os
+import uuid
+import logging
+import numpy as np
+from PIL import Image, ImageEnhance, ImageFilter
+import cv2
def process_image(image_path, output_folder):
    """
    Produce a cleaned edge map of the input image for geospatial analysis.

    Processing steps, in order:
    - Convert to RGB, then to grayscale
    - Apply a 5x5 Gaussian blur for noise reduction
    - Apply inverted adaptive thresholding to highlight features
    - Apply Canny edge detection
    - Apply a 3x3 morphological close to clean up the edges

    Args:
        image_path (str): Path to the input image
        output_folder (str): Directory to save processed images; created if
            it does not exist

    Returns:
        str: Path to the processed image, a PNG with a random name ending in
        "_processed.png"

    Raises:
        Exception: If any step fails. The message starts with
            "Image processing failed:" and the original error is attached
            as ``__cause__``.
    """
    try:
        logging.info(f"Processing image: {image_path}")
        # Load the pixel data inside the context manager so the file handle
        # is released as soon as the array has been built
        with Image.open(image_path) as img:
            rgb = img if img.mode == 'RGB' else img.convert('RGB')
            img_array = np.array(rgb)
        # Convert to grayscale
        gray = cv2.cvtColor(img_array, cv2.COLOR_RGB2GRAY)
        # Apply Gaussian blur for noise reduction
        blurred = cv2.GaussianBlur(gray, (5, 5), 0)
        # Apply adaptive thresholding
        thresh = cv2.adaptiveThreshold(
            blurred, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
            cv2.THRESH_BINARY_INV, 11, 2
        )
        # Edge detection using Canny algorithm
        edges = cv2.Canny(thresh, 50, 150)
        # Morphological operations to clean up the result
        kernel = np.ones((3, 3), np.uint8)
        cleaned = cv2.morphologyEx(edges, cv2.MORPH_CLOSE, kernel)
        # Convert back to PIL Image
        processed_img = Image.fromarray(cleaned)
        # Make sure the destination exists ("" means the current directory)
        if output_folder:
            os.makedirs(output_folder, exist_ok=True)
        processed_filename = f"{uuid.uuid4().hex}_processed.png"
        output_path = os.path.join(output_folder, processed_filename)
        processed_img.save(output_path)
        logging.info(f"Image processing complete: {output_path}")
        return output_path
    except Exception as e:
        logging.error(f"Error in image processing: {str(e)}")
        # Chain the original error so the real traceback is not lost
        raise Exception(f"Image processing failed: {str(e)}") from e

utils/segmentation.py ADDED Viewed

	@@ -0,0 +1,237 @@

+"""
+Segmentation utilities for image processing inspired by CLIPSeg techniques.
+This is a simplified version that does not require the full transformers library.
+"""
+import os
+import logging
+import numpy as np
+import cv2
+from PIL import Image
+from utils.geospatial import extract_contours, simplify_polygons, regularize_polygons, merge_nearby_polygons
def segment_by_color_threshold(image_path, output_path=None,
                              threshold=127, color_channel=1,
                              smoothing_sigma=1.0):
    """
    Build a binary mask by thresholding a single color channel.

    Args:
        image_path (str): Path to the input image
        output_path (str, optional): Where to write the mask; skipped if falsy
        threshold (int): Pixel intensity threshold (0-255)
        color_channel (int): Channel to threshold (0=R, 1=G, 2=B); any other
            value falls back to the grayscale image
        smoothing_sigma (float): Gaussian smoothing sigma; no blur when <= 0

    Returns:
        numpy.ndarray: Segmentation mask, or None if anything fails
    """
    try:
        bgr = cv2.imread(image_path)
        if bgr is None:
            # OpenCV could not decode the file: load through PIL instead and
            # flip RGB -> BGR so the rest of the code sees OpenCV ordering
            rgb = np.array(Image.open(image_path).convert('RGB'))
            bgr = rgb[:, :, ::-1]

        # OpenCV stores planes as B, G, R; re-index them in R, G, B order
        blue, green, red = cv2.split(bgr)
        if 0 <= color_channel < 3:
            plane = (red, green, blue)[color_channel]
        else:
            plane = cv2.cvtColor(bgr, cv2.COLOR_BGR2GRAY)

        # Blur first so isolated noisy pixels do not survive the threshold
        if smoothing_sigma > 0:
            plane = cv2.GaussianBlur(plane, (0, 0), smoothing_sigma)

        mask = cv2.threshold(plane, threshold, 255, cv2.THRESH_BINARY)[1]

        if output_path:
            cv2.imwrite(output_path, mask)
            logging.info(f"Saved segmentation mask to {output_path}")
        return mask
    except Exception as e:
        logging.error(f"Error in segmentation: {str(e)}")
        return None
def segment_by_adaptive_threshold(image_path, output_path=None,
                                 block_size=11, c=2,
                                 smoothing_sigma=1.0):
    """
    Build a binary mask with Gaussian adaptive thresholding, which copes
    better with lighting variations than a single global threshold.

    Args:
        image_path (str): Path to the input image
        output_path (str, optional): Where to write the mask; skipped if falsy
        block_size (int): Size of the pixel neighborhood for threshold calculation
        c (int): Constant subtracted from the mean
        smoothing_sigma (float): Gaussian smoothing sigma; no blur when <= 0

    Returns:
        numpy.ndarray: Segmentation mask, or None if anything fails
    """
    try:
        image = cv2.imread(image_path)
        if image is None:
            # OpenCV could not decode the file: load through PIL instead and
            # flip RGB -> BGR for OpenCV compatibility
            rgb = np.array(Image.open(image_path).convert('RGB'))
            image = rgb[:, :, ::-1]

        grey = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
        if smoothing_sigma > 0:
            grey = cv2.GaussianBlur(grey, (0, 0), smoothing_sigma)

        mask = cv2.adaptiveThreshold(
            grey, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
            cv2.THRESH_BINARY, block_size, c
        )

        if output_path:
            cv2.imwrite(output_path, mask)
            logging.info(f"Saved segmentation mask to {output_path}")
        return mask
    except Exception as e:
        logging.error(f"Error in segmentation: {str(e)}")
        return None
def segment_by_otsu(image_path, output_path=None, smoothing_sigma=1.0):
    """
    Build a binary mask using Otsu's automatic threshold selection.

    Args:
        image_path (str): Path to the input image
        output_path (str, optional): Where to write the mask; skipped if falsy
        smoothing_sigma (float): Gaussian smoothing sigma; no blur when <= 0

    Returns:
        numpy.ndarray: Segmentation mask, or None if anything fails
    """
    try:
        image = cv2.imread(image_path)
        if image is None:
            # OpenCV could not decode the file: load through PIL instead and
            # flip RGB -> BGR for OpenCV compatibility
            rgb = np.array(Image.open(image_path).convert('RGB'))
            image = rgb[:, :, ::-1]

        grey = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
        if smoothing_sigma > 0:
            grey = cv2.GaussianBlur(grey, (0, 0), smoothing_sigma)

        # The threshold argument (0) is ignored: the OTSU flag picks it
        otsu_flags = cv2.THRESH_BINARY + cv2.THRESH_OTSU
        mask = cv2.threshold(grey, 0, 255, otsu_flags)[1]

        if output_path:
            cv2.imwrite(output_path, mask)
            logging.info(f"Saved segmentation mask to {output_path}")
        return mask
    except Exception as e:
        logging.error(f"Error in segmentation: {str(e)}")
        return None
def segment_and_extract_features(image_path, output_mask_path=None,
                                feature_type="buildings",
                                min_area=50, simplify_tolerance=2.0,
                                merge_distance=5.0):
    """
    Complete pipeline for segmentation and feature extraction.

    The segmentation method is picked from ``feature_type`` (matched
    case-insensitively):
    - "buildings": adaptive thresholding, then polygon regularization
    - "trees" / "vegetation": green-channel threshold
    - "water": red-channel threshold
    - anything else (including "roads"): Otsu thresholding

    Args:
        image_path (str): Path to the input image
        output_mask_path (str, optional): Path to save the segmentation mask.
            When omitted, the mask is written to a temporary
            "<image name>_mask.png" next to the image and removed afterwards.
        feature_type (str): Type of features to extract ("buildings", "trees", "water", "roads")
        min_area (int): Minimum feature area to keep
        simplify_tolerance (float): Tolerance for polygon simplification
        merge_distance (float): Distance for merging nearby polygons

    Returns:
        tuple: (mask, polygons) - Segmentation mask and list of simplified
        Shapely polygons; (None, []) if segmentation fails
    """
    kind = feature_type.lower()

    # Choose segmentation method based on feature type
    if kind == "buildings":
        mask = segment_by_adaptive_threshold(
            image_path, output_mask_path,
            block_size=15, c=2, smoothing_sigma=1.0
        )
    elif kind in ("trees", "vegetation"):
        mask = segment_by_color_threshold(
            image_path, output_mask_path,
            threshold=140, color_channel=1, smoothing_sigma=1.5
        )
    elif kind == "water":
        mask = segment_by_color_threshold(
            image_path, output_mask_path,
            threshold=120, color_channel=0, smoothing_sigma=2.0
        )
    else:
        # Default to Otsu for unknown feature types
        mask = segment_by_otsu(
            image_path, output_mask_path, smoothing_sigma=1.0
        )
    if mask is None:
        logging.error("Segmentation failed")
        return None, []

    # extract_contours works on a file path, so write the mask to a temporary
    # file when the caller did not ask for it to be saved
    temp_mask_path = None
    if output_mask_path:
        mask_path = output_mask_path
    else:
        temp_mask_path = os.path.join(
            os.path.dirname(image_path),
            f"{os.path.splitext(os.path.basename(image_path))[0]}_mask.png"
        )
        if not cv2.imwrite(temp_mask_path, mask):
            logging.warning(f"Could not write temporary mask to {temp_mask_path}")
        mask_path = temp_mask_path

    try:
        # Extract contours from the mask
        polygons = extract_contours(mask_path, min_area=min_area)
        logging.info(f"Extracted {len(polygons)} initial polygons")
    finally:
        # Remove the temporary file even if contour extraction raised
        if temp_mask_path and os.path.exists(temp_mask_path):
            os.remove(temp_mask_path)

    # Simplify polygons
    polygons = simplify_polygons(polygons, tolerance=simplify_tolerance)
    # If buildings, regularize them to make more rectangular
    if kind == "buildings":
        polygons = regularize_polygons(polygons)
    # Merge nearby polygons to reduce count
    polygons = merge_nearby_polygons(polygons, distance_threshold=merge_distance)
    logging.info(f"After processing: {len(polygons)} polygons")
    return mask, polygons