diff --git a/jetson/ros2_ws/src/saltybot_segmentation/config/segmentation_params.yaml b/jetson/ros2_ws/src/saltybot_segmentation/config/segmentation_params.yaml
new file mode 100644
index 0000000..2c6256b
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/config/segmentation_params.yaml
@@ -0,0 +1,64 @@
+# segmentation_params.yaml — SaltyBot sidewalk semantic segmentation
+#
+# Run with:
+# ros2 launch saltybot_segmentation sidewalk_segmentation.launch.py
+#
+# Build TRT engine first (run ONCE on the Jetson):
+# python3 /opt/ros/humble/share/saltybot_segmentation/scripts/build_engine.py
+
+# ── Model paths ───────────────────────────────────────────────────────────────
+# Priority: TRT engine > ONNX > error (no inference)
+#
+# Build engine:
+# python3 build_engine.py --model bisenetv2
+# → /mnt/nvme/saltybot/models/bisenetv2_cityscapes_512x256.engine
+engine_path: /mnt/nvme/saltybot/models/bisenetv2_cityscapes_512x256.engine
+onnx_path: /mnt/nvme/saltybot/models/bisenetv2_cityscapes_512x256.onnx
+
+# ── Model input size ──────────────────────────────────────────────────────────
+# Must match the engine. 512×256 maintains Cityscapes 2:1 aspect ratio.
+# RealSense 640×480 is letterboxed to 512×256 (pillarboxed, ≈85 px each side).
+input_width: 512
+input_height: 256
+
+# ── Processing rate ───────────────────────────────────────────────────────────
+# process_every_n: run inference on 1 in N frames.
+# 1 = every frame (~15fps if latency budget allows)
+# 2 = every 2nd frame (recommended — RealSense @ 30fps → ~15fps effective)
+# 3 = every 3rd frame (~10fps from a 30fps camera — use if GPU is constrained by other tasks)
+#
+# RealSense color at 15fps → process_every_n:=1 gives ~15fps seg output.
+process_every_n: 1
+
+# ── Debug image ───────────────────────────────────────────────────────────────
+# Set true to publish /segmentation/debug_image (BGR colour overlay).
+# Adds ~1ms/frame overhead. Disable in production.
+publish_debug_image: false
+
+# ── Traversability overrides ──────────────────────────────────────────────────
+# unknown_as_obstacle: true → sky / unlabelled pixels → lethal (100).
+# Use in dense urban environments where unknowns are likely vertical surfaces.
+# Use false (default) in open spaces to allow exploration.
+unknown_as_obstacle: false
+
+# ── Costmap projection ────────────────────────────────────────────────────────
+# costmap_resolution: metres per cell in the output OccupancyGrid.
+# Match or exceed Nav2 local_costmap resolution (default 0.05m).
+costmap_resolution: 0.05 # metres/cell
+
+# costmap_range_m: forward look-ahead distance for ground projection.
+# 5.0m covers 100 cells at 0.05m resolution.
+# Increase for faster outdoor navigation; decrease for tight indoor spaces.
+costmap_range_m: 5.0 # metres
+
+# ── Camera geometry ───────────────────────────────────────────────────────────
+# These must match the RealSense mount position on the robot.
+# Used for inverse-perspective ground projection.
+#
+# camera_height_m: height of RealSense optical centre above ground (metres).
+# saltybot: D435i mounted at ~0.15m above base_link origin.
+camera_height_m: 0.15 # metres
+
+# camera_pitch_deg: downward tilt of the camera (degrees, positive = tilted down).
+# 0 = horizontal. Typical outdoor deployment: 5–10° downward.
+camera_pitch_deg: 5.0 # degrees
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/docs/training_guide.md b/jetson/ros2_ws/src/saltybot_segmentation/docs/training_guide.md
new file mode 100644
index 0000000..147fdb4
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/docs/training_guide.md
@@ -0,0 +1,268 @@
+# Sidewalk Segmentation — Training & Deployment Guide
+
+## Overview
+
+SaltyBot uses **BiSeNetV2** (default) or **DDRNet-23-slim** for real-time semantic
+segmentation, pre-trained on Cityscapes and optionally fine-tuned on site-specific data.
+
+The model runs at **>15fps on Orin Nano Super** via TensorRT FP16 at 512×256 input,
+publishing per-pixel traversability costs to Nav2.
+
+---
+
+## Traversability Classes
+
+| Class | ID | OccupancyGrid | Description |
+|-------|----|---------------|-------------|
+| Sidewalk | 0 | 0 (free) | Preferred navigation surface |
+| Grass/vegetation | 1 | 50 (medium) | Traversable but non-preferred |
+| Road | 2 | 90 (high cost) | Avoid but can cross |
+| Obstacle | 3 | 100 (lethal) | Person, car, building, fence |
+| Unknown | 4 | -1 (unknown) | Sky, unlabelled |
+
+---
+
+## Quick Start — Pretrained Cityscapes Model
+
+No training required for standard sidewalks in Western cities.
+
+```bash
+# 1. Build the TRT engine (once, on Orin):
+python3 /opt/ros/humble/share/saltybot_segmentation/scripts/build_engine.py
+
+# 2. Launch:
+ros2 launch saltybot_segmentation sidewalk_segmentation.launch.py
+
+# 3. Verify:
+ros2 topic hz /segmentation/mask # expect ~15Hz
+ros2 topic hz /segmentation/costmap # expect ~15Hz
+ros2 run rviz2 rviz2 # add OccupancyGrid, topic=/segmentation/costmap
+```
+
+---
+
+## Model Benchmarks — Cityscapes Validation Set
+
+| Model | mIoU | Sidewalk IoU | Road IoU | FPS (Orin FP16) | Engine size |
+|-------|------|--------------|----------|-----------------|-------------|
+| BiSeNetV2 | 72.6% | 82.1% | 97.8% | ~50 fps | ~11 MB |
+| DDRNet-23-slim | 79.5% | 84.3% | 98.1% | ~40 fps | ~18 MB |
+
+Both exceed the **>15fps target** with headroom for additional ROS2 overhead.
+
+BiSeNetV2 is the default — faster, smaller, sufficient for traversability.
+Use DDRNet if mIoU matters more than latency (e.g., complex European city centres).
+
+---
+
+## Fine-Tuning on Custom Site Data
+
+### When is fine-tuning needed?
+
+The Cityscapes-trained model works well for:
+- European-style city sidewalks, curbs, roads
+- Standard pedestrian infrastructure
+
+Fine-tuning improves performance for:
+- Gravel/dirt paths (not in Cityscapes)
+- Unusual kerb styles or non-standard pavement markings
+- Indoor+outdoor transitions (garage exits, building entrances)
+- Non-Western road infrastructure
+
+### Step 1 — Collect data (walk the route)
+
+Record a ROS2 bag while walking the intended robot route:
+
+```bash
+# On Orin, record the front camera for 5–10 minutes of the target environment:
+ros2 bag record /camera/color/image_raw -o sidewalk_route_2024-01
+
+# Transfer to workstation for labelling:
+scp -r jetson:/home/ubuntu/sidewalk_route_2024-01 ~/datasets/
+```
+
+### Step 2 — Extract frames
+
+```bash
+python3 fine_tune.py \
+ --extract-frames ~/datasets/sidewalk_route_2024-01/ \
+ --output-dir ~/datasets/sidewalk_raw/ \
+ --every-n 5 # 1 frame per 5 = ~6fps from 30fps bag
+```
+
+This extracts ~1800 frames from a 5-minute 30fps bag (≈6fps kept). You still only need to label **50–100 frames** minimum.
+
+### Step 3 — Label with LabelMe
+
+```bash
+pip install labelme
+labelme ~/datasets/sidewalk_raw/
+```
+
+**Class names to use** (must be exact):
+
+| What you see | LabelMe label |
+|--------------|---------------|
+| Footpath/pavement | `sidewalk` |
+| Road/tarmac | `road` |
+| Grass/lawn/verge | `vegetation` |
+| Gravel path | `terrain` |
+| Person | `person` |
+| Car/vehicle | `car` |
+| Building/wall | `building` |
+| Fence/gate | `fence` |
+
+**Labelling tips:**
+- Use **polygon** tool for precise boundaries
+- Focus on the ground plane (lower 60% of image) — that's what the costmap uses
+- 50 well-labelled frames beats 200 rushed ones
+- Vary conditions: sunny, overcast, morning, evening
+
+### Step 4 — Convert labels to masks
+
+```bash
+python3 fine_tune.py \
+ --convert-labels ~/datasets/sidewalk_raw/ \
+ --output-dir ~/datasets/sidewalk_masks/
+```
+
+Output: `_mask.png` per frame — 8-bit PNG with Cityscapes class IDs.
+Unlabelled pixels are set to 255 (ignored during training).
+
+### Step 5 — Fine-tune
+
+```bash
+# On Orin (or workstation with CUDA):
+python3 fine_tune.py --train \
+ --images ~/datasets/sidewalk_raw/ \
+ --labels ~/datasets/sidewalk_masks/ \
+ --weights /mnt/nvme/saltybot/models/bisenetv2_cityscapes.pth \
+ --output /mnt/nvme/saltybot/models/bisenetv2_custom.pth \
+ --epochs 20 \
+ --lr 1e-4
+```
+
+Expected training time:
+- 50 images, 20 epochs, Orin: ~15 minutes
+- 100 images, 20 epochs, Orin: ~25 minutes
+
+### Step 6 — Evaluate mIoU
+
+```bash
+python3 fine_tune.py --eval \
+ --images ~/datasets/sidewalk_raw/ \
+ --labels ~/datasets/sidewalk_masks/ \
+ --weights /mnt/nvme/saltybot/models/bisenetv2_custom.pth
+```
+
+Target mIoU on custom classes: >70% on sidewalk/road/obstacle.
+
+### Step 7 — Build new TRT engine
+
+```bash
+python3 build_engine.py \
+ --weights /mnt/nvme/saltybot/models/bisenetv2_custom.pth \
+ --engine /mnt/nvme/saltybot/models/bisenetv2_custom_512x256.engine
+```
+
+Update `segmentation_params.yaml`:
+```yaml
+engine_path: /mnt/nvme/saltybot/models/bisenetv2_custom_512x256.engine
+```
+
+---
+
+## Nav2 Integration — SegmentationCostmapLayer
+
+Add to `nav2_params.yaml`:
+
+```yaml
+local_costmap:
+ local_costmap:
+ ros__parameters:
+ plugins:
+ - "voxel_layer"
+ - "inflation_layer"
+ - "segmentation_layer" # ← add this
+
+ segmentation_layer:
+ plugin: "saltybot_segmentation_costmap::SegmentationCostmapLayer"
+ enabled: true
+ topic: /segmentation/costmap
+ combination_method: max # max | override | min
+```
+
+**combination_method:**
+- `max` (default) — keeps the worst-case cost between existing costmap and segmentation.
+ Most conservative; prevents Nav2 from overriding obstacle detections.
+- `override` — segmentation completely replaces existing cell costs.
+ Use when you trust the camera more than other sensors.
+- `min` — keeps the most permissive cost.
+ Use for exploratory navigation in open environments.
+
+---
+
+## Performance Tuning
+
+### Too slow (<15fps)
+
+1. **Increase process_every_n** (e.g., `process_every_n: 2` → effective 15fps from 30fps camera)
+2. **Reduce input resolution** — edit `build_engine.py` to use 384×192 (≈1.8× fewer pixels)
+3. **Ensure nvpmodel is in MAXN mode**: `sudo nvpmodel -m 0 && sudo jetson_clocks`
+4. Check GPU is not throttled: `jtop` → GPU frequency should be ≈1020MHz
+
+### False road detections (sidewalk near road)
+
+- Lower `camera_pitch_deg` to look further ahead
+- Enable `unknown_as_obstacle: true` to be more cautious
+- Fine-tune with site-specific data (Step 5)
+
+### Costmap looks noisy
+
+- Increase `costmap_resolution` (0.1m cells reduce noise)
+- Reduce `costmap_range_m` to 3.0m (projection less accurate at far range)
+- Apply temporal smoothing in Nav2 inflation layer
+
+---
+
+## Datasets
+
+### Cityscapes (primary pre-training)
+- **2975 training / 500 validation** finely annotated images
+- 19 semantic classes (roads, sidewalks, people, vehicles, etc.)
+- License: Cityscapes Terms of Use (non-commercial research)
+- Download: https://www.cityscapes-dataset.com/
+- Required for training from scratch; BiSeNetV2 pretrained checkpoint (~25MB) available at:
+ https://github.com/CoinCheung/BiSeNet/releases
+
+### Mapillary Vistas (supplementary)
+- **18,000 training images** from diverse global street scenes
+- 124 semantic classes (broader coverage than Cityscapes)
+- Includes dirt paths, gravel, unusual sidewalk types
+- License: CC BY-SA 4.0
+- Download: https://www.mapillary.com/dataset/vistas
+- Useful for mapping to our traversability classes in non-European environments
+
+### Custom saltybot data
+- Collected per-deployment via `fine_tune.py --extract-frames`
+- 50–100 labelled frames typical for 80%+ mIoU on specific routes
+- Store in `/mnt/nvme/saltybot/training_data/`
+
+---
+
+## File Locations on Orin
+
+```
+/mnt/nvme/saltybot/
+├── models/
+│ ├── bisenetv2_cityscapes.pth ← downloaded pretrained weights
+│ ├── bisenetv2_cityscapes_512x256.onnx ← exported ONNX (FP32)
+│ ├── bisenetv2_cityscapes_512x256.engine ← TRT FP16 engine (built on Orin)
+│ ├── bisenetv2_custom.pth ← fine-tuned weights (after step 5)
+│ └── bisenetv2_custom_512x256.engine ← TRT FP16 engine (after step 7)
+├── training_data/
+│ ├── raw/ ← extracted JPEG frames
+│ └── labels/ ← LabelMe JSON + converted PNG masks
+└── rosbags/
+ └── sidewalk_route_*/ ← recorded ROS2 bags for labelling
+```
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/launch/sidewalk_segmentation.launch.py b/jetson/ros2_ws/src/saltybot_segmentation/launch/sidewalk_segmentation.launch.py
new file mode 100644
index 0000000..5132e4d
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/launch/sidewalk_segmentation.launch.py
@@ -0,0 +1,58 @@
+"""
+sidewalk_segmentation.launch.py — Launch semantic sidewalk segmentation node.
+
+Usage:
+ ros2 launch saltybot_segmentation sidewalk_segmentation.launch.py
+ ros2 launch saltybot_segmentation sidewalk_segmentation.launch.py publish_debug_image:=true
+ ros2 launch saltybot_segmentation sidewalk_segmentation.launch.py engine_path:=/custom/model.engine
+"""
+
+import os
+from ament_index_python.packages import get_package_share_directory
+from launch import LaunchDescription
+from launch.actions import DeclareLaunchArgument
+from launch.substitutions import LaunchConfiguration
+from launch_ros.actions import Node
+
+
+def generate_launch_description():
+ pkg = get_package_share_directory("saltybot_segmentation")
+ cfg = os.path.join(pkg, "config", "segmentation_params.yaml")
+
+ return LaunchDescription([
+ DeclareLaunchArgument("engine_path",
+ default_value="/mnt/nvme/saltybot/models/bisenetv2_cityscapes_512x256.engine",
+ description="Path to TensorRT .engine file"),
+ DeclareLaunchArgument("onnx_path",
+ default_value="/mnt/nvme/saltybot/models/bisenetv2_cityscapes_512x256.onnx",
+ description="Path to ONNX fallback model"),
+ DeclareLaunchArgument("process_every_n", default_value="1",
+ description="Run inference every N frames (1=every frame)"),
+ DeclareLaunchArgument("publish_debug_image", default_value="false",
+ description="Publish colour-coded debug image on /segmentation/debug_image"),
+ DeclareLaunchArgument("unknown_as_obstacle", default_value="false",
+ description="Treat unknown pixels as lethal obstacles"),
+ DeclareLaunchArgument("costmap_range_m", default_value="5.0",
+ description="Forward look-ahead range for costmap projection (m)"),
+ DeclareLaunchArgument("camera_pitch_deg", default_value="5.0",
+ description="Camera downward pitch angle (degrees)"),
+
+ Node(
+ package="saltybot_segmentation",
+ executable="sidewalk_seg",
+ name="sidewalk_seg",
+ output="screen",
+ parameters=[
+ cfg,
+ {
+ "engine_path": LaunchConfiguration("engine_path"),
+ "onnx_path": LaunchConfiguration("onnx_path"),
+ "process_every_n": LaunchConfiguration("process_every_n"),
+ "publish_debug_image": LaunchConfiguration("publish_debug_image"),
+ "unknown_as_obstacle": LaunchConfiguration("unknown_as_obstacle"),
+ "costmap_range_m": LaunchConfiguration("costmap_range_m"),
+ "camera_pitch_deg": LaunchConfiguration("camera_pitch_deg"),
+ },
+ ],
+ ),
+ ])
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/package.xml b/jetson/ros2_ws/src/saltybot_segmentation/package.xml
new file mode 100644
index 0000000..41f0936
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/package.xml
@@ -0,0 +1,32 @@
+
+
+
+ saltybot_segmentation
+ 0.1.0
+
+ Semantic sidewalk segmentation for SaltyBot outdoor autonomous navigation.
+ BiSeNetV2 / DDRNet-23-slim with TensorRT FP16 on Orin Nano Super.
+ Publishes traversability mask + Nav2 OccupancyGrid costmap.
+
+ seb
+ MIT
+
+ ament_python
+
+ rclpy
+ sensor_msgs
+ nav_msgs
+ std_msgs
+ cv_bridge
+ python3-numpy
+ python3-opencv
+
+ ament_copyright
+ ament_flake8
+ ament_pep257
+ pytest
+
+
+ ament_python
+
+
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/resource/saltybot_segmentation b/jetson/ros2_ws/src/saltybot_segmentation/resource/saltybot_segmentation
new file mode 100644
index 0000000..e69de29
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/saltybot_segmentation/__init__.py b/jetson/ros2_ws/src/saltybot_segmentation/saltybot_segmentation/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/saltybot_segmentation/seg_utils.py b/jetson/ros2_ws/src/saltybot_segmentation/saltybot_segmentation/seg_utils.py
new file mode 100644
index 0000000..1a41f35
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/saltybot_segmentation/seg_utils.py
@@ -0,0 +1,273 @@
+"""
+seg_utils.py — Pure helpers for semantic segmentation and traversability mapping.
+
+No ROS2, TensorRT, or PyTorch imports — fully testable without GPU or ROS2 install.
+
+Cityscapes 19-class → 5-class traversability mapping
+──────────────────────────────────────────────────────
+ Cityscapes ID → Traversability class → OccupancyGrid value
+
+ 0 road → ROAD → 90 (high cost — don't drive on road)
+ 1 sidewalk → SIDEWALK → 0 (free — preferred surface)
+ 2 building → OBSTACLE → 100 (lethal)
+ 3 wall → OBSTACLE → 100
+ 4 fence → OBSTACLE → 100
+ 5 pole → OBSTACLE → 100
+ 6 traffic light→ OBSTACLE → 100
+ 7 traffic sign → OBSTACLE → 100
+ 8 vegetation → GRASS → 50 (medium — can traverse slowly)
+ 9 terrain → GRASS → 50
+ 10 sky → UNKNOWN → -1 (unknown)
+ 11 person → OBSTACLE → 100 (lethal — safety critical)
+ 12 rider → OBSTACLE → 100
+ 13 car → OBSTACLE → 100
+ 14 truck → OBSTACLE → 100
+ 15 bus → OBSTACLE → 100
+ 16 train → OBSTACLE → 100
+ 17 motorcycle → OBSTACLE → 100
+ 18 bicycle → OBSTACLE → 100
+
+Segmentation mask class IDs (published on /segmentation/mask)
+─────────────────────────────────────────────────────────────
+ TRAV_SIDEWALK = 0
+ TRAV_GRASS = 1
+ TRAV_ROAD = 2
+ TRAV_OBSTACLE = 3
+ TRAV_UNKNOWN = 4
+"""
+
+import numpy as np
+
+# ── Traversability class constants ────────────────────────────────────────────
+
+TRAV_SIDEWALK = 0
+TRAV_GRASS = 1
+TRAV_ROAD = 2
+TRAV_OBSTACLE = 3
+TRAV_UNKNOWN = 4
+
+NUM_TRAV_CLASSES = 5
+
+# ── OccupancyGrid cost values for each traversability class ───────────────────
+# Nav2 OccupancyGrid: 0=free, 1-99=cost, 100=lethal, -1=unknown
+
+TRAV_TO_COST = {
+ TRAV_SIDEWALK: 0, # free — preferred surface
+ TRAV_GRASS: 50, # medium cost — traversable but non-preferred
+ TRAV_ROAD: 90, # high cost — avoid but can cross
+ TRAV_OBSTACLE: 100, # lethal — never enter
+ TRAV_UNKNOWN: -1, # unknown — Nav2 treats as unknown cell
+}
+
+# ── Cityscapes 19-class → traversability lookup table ─────────────────────────
+# Index = Cityscapes training ID (0–18)
+
+_CITYSCAPES_TO_TRAV = np.array([
+ TRAV_ROAD, # 0 road
+ TRAV_SIDEWALK, # 1 sidewalk
+ TRAV_OBSTACLE, # 2 building
+ TRAV_OBSTACLE, # 3 wall
+ TRAV_OBSTACLE, # 4 fence
+ TRAV_OBSTACLE, # 5 pole
+ TRAV_OBSTACLE, # 6 traffic light
+ TRAV_OBSTACLE, # 7 traffic sign
+ TRAV_GRASS, # 8 vegetation
+ TRAV_GRASS, # 9 terrain
+ TRAV_UNKNOWN, # 10 sky
+ TRAV_OBSTACLE, # 11 person
+ TRAV_OBSTACLE, # 12 rider
+ TRAV_OBSTACLE, # 13 car
+ TRAV_OBSTACLE, # 14 truck
+ TRAV_OBSTACLE, # 15 bus
+ TRAV_OBSTACLE, # 16 train
+ TRAV_OBSTACLE, # 17 motorcycle
+ TRAV_OBSTACLE, # 18 bicycle
+], dtype=np.uint8)
+
+# ── Visualisation colour map (BGR, for cv2.imshow / debug image) ──────────────
+# One colour per traversability class
+
+TRAV_COLORMAP_BGR = np.array([
+ [128, 64, 128], # SIDEWALK — purple
+ [152, 251, 152], # GRASS — pale green
+ [128, 0, 128], # ROAD — dark magenta
+ [ 60, 20, 220], # OBSTACLE — red-ish
+ [ 0, 0, 0], # UNKNOWN — black
+], dtype=np.uint8)
+
+
+# ── Core mapping functions ────────────────────────────────────────────────────
+
+def cityscapes_to_traversability(mask: np.ndarray) -> np.ndarray:
+ """
+ Map a Cityscapes 19-class segmentation mask to traversability classes.
+
+ Parameters
+ ----------
+ mask : np.ndarray, shape (H, W), dtype uint8
+        Cityscapes class IDs in range [0, 18]. Out-of-range values are
+        clamped to the nearest valid ID (0 or 18) — not mapped to unknown.
+
+ Returns
+ -------
+ trav_mask : np.ndarray, shape (H, W), dtype uint8
+ Traversability class IDs in range [0, 4].
+ """
+    # Clamp out-of-range IDs into [0, 18] (nearest valid ID — NOT unknown)
+ clipped = np.clip(mask.astype(np.int32), 0, len(_CITYSCAPES_TO_TRAV) - 1)
+ return _CITYSCAPES_TO_TRAV[clipped]
+
+
+def traversability_to_costmap(
+ trav_mask: np.ndarray,
+ unknown_as_obstacle: bool = False,
+) -> np.ndarray:
+ """
+ Convert a traversability mask to Nav2 OccupancyGrid int8 cost values.
+
+ Parameters
+ ----------
+ trav_mask : np.ndarray, shape (H, W), dtype uint8
+ Traversability class IDs (TRAV_* constants).
+ unknown_as_obstacle : bool
+ If True, TRAV_UNKNOWN cells are set to 100 (lethal) instead of -1.
+ Useful in dense urban environments where unknowns are likely walls.
+
+ Returns
+ -------
+ cost_map : np.ndarray, shape (H, W), dtype int8
+ OccupancyGrid cost values: 0=free, 1-99=cost, 100=lethal, -1=unknown.
+ """
+ H, W = trav_mask.shape
+ cost_map = np.full((H, W), -1, dtype=np.int8)
+
+ for trav_class, cost in TRAV_TO_COST.items():
+ if trav_class == TRAV_UNKNOWN and unknown_as_obstacle:
+ cost = 100
+ cost_map[trav_mask == trav_class] = cost
+
+ return cost_map
+
+
+def letterbox(
+ image: np.ndarray,
+ target_w: int,
+ target_h: int,
+ pad_value: int = 114,
+) -> tuple:
+ """
+ Letterbox-resize an image to (target_w, target_h) preserving aspect ratio.
+
+ Parameters
+ ----------
+ image : np.ndarray, shape (H, W, C), dtype uint8
+ target_w, target_h : int
+ Target width and height.
+ pad_value : int
+ Padding fill value.
+
+ Returns
+ -------
+ (canvas, scale, pad_left, pad_top) : tuple
+ canvas : np.ndarray (target_h, target_w, C) — resized + padded image
+ scale : float — scale factor applied (min of w_scale, h_scale)
+ pad_left : int — horizontal padding (pixels from left)
+ pad_top : int — vertical padding (pixels from top)
+ """
+ import cv2 # lazy import — keeps module importable without cv2 in tests
+
+ src_h, src_w = image.shape[:2]
+ scale = min(target_w / src_w, target_h / src_h)
+ new_w = int(round(src_w * scale))
+ new_h = int(round(src_h * scale))
+
+ resized = cv2.resize(image, (new_w, new_h), interpolation=cv2.INTER_LINEAR)
+
+ pad_left = (target_w - new_w) // 2
+ pad_top = (target_h - new_h) // 2
+
+ canvas = np.full((target_h, target_w, image.shape[2]), pad_value, dtype=np.uint8)
+ canvas[pad_top:pad_top + new_h, pad_left:pad_left + new_w] = resized
+
+ return canvas, scale, pad_left, pad_top
+
+
+def unpad_mask(
+ mask: np.ndarray,
+ orig_h: int,
+ orig_w: int,
+ scale: float,
+ pad_left: int,
+ pad_top: int,
+) -> np.ndarray:
+ """
+ Remove letterbox padding from a segmentation mask and resize to original.
+
+ Parameters
+ ----------
+ mask : np.ndarray, shape (target_h, target_w), dtype uint8
+ Segmentation output from model at letterboxed resolution.
+ orig_h, orig_w : int
+ Original image dimensions (before letterboxing).
+ scale, pad_left, pad_top : from letterbox()
+
+ Returns
+ -------
+ restored : np.ndarray, shape (orig_h, orig_w), dtype uint8
+ """
+ import cv2
+
+ new_h = int(round(orig_h * scale))
+ new_w = int(round(orig_w * scale))
+
+ cropped = mask[pad_top:pad_top + new_h, pad_left:pad_left + new_w]
+ restored = cv2.resize(cropped, (orig_w, orig_h), interpolation=cv2.INTER_NEAREST)
+ return restored
+
+
+def preprocess_for_inference(
+ image_bgr: np.ndarray,
+ input_w: int = 512,
+ input_h: int = 256,
+) -> tuple:
+ """
+ Preprocess a BGR image for BiSeNetV2 / DDRNet inference.
+
+ Applies letterboxing, BGR→RGB conversion, ImageNet normalisation,
+ HWC→NCHW layout, and float32 conversion.
+
+ Returns
+ -------
+ (blob, scale, pad_left, pad_top) : tuple
+ blob : np.ndarray (1, 3, input_h, input_w) float32 — model input
+ scale, pad_left, pad_top : for unpad_mask()
+ """
+ import cv2
+
+ canvas, scale, pad_left, pad_top = letterbox(image_bgr, input_w, input_h)
+
+ # BGR → RGB
+ rgb = cv2.cvtColor(canvas, cv2.COLOR_BGR2RGB)
+
+ # ImageNet normalisation
+ mean = np.array([0.485, 0.456, 0.406], dtype=np.float32)
+ std = np.array([0.229, 0.224, 0.225], dtype=np.float32)
+ img = rgb.astype(np.float32) / 255.0
+ img = (img - mean) / std
+
+ # HWC → NCHW
+ blob = np.ascontiguousarray(img.transpose(2, 0, 1)[np.newaxis])
+
+ return blob, scale, pad_left, pad_top
+
+
+def colorise_traversability(trav_mask: np.ndarray) -> np.ndarray:
+ """
+    Convert traversability mask to a BGR visualisation image.
+
+ Returns
+ -------
+ vis : np.ndarray (H, W, 3) uint8 BGR — suitable for cv2.imshow / ROS Image
+ """
+ clipped = np.clip(trav_mask.astype(np.int32), 0, NUM_TRAV_CLASSES - 1)
+ return TRAV_COLORMAP_BGR[clipped]
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/saltybot_segmentation/sidewalk_seg_node.py b/jetson/ros2_ws/src/saltybot_segmentation/saltybot_segmentation/sidewalk_seg_node.py
new file mode 100644
index 0000000..865131a
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/saltybot_segmentation/sidewalk_seg_node.py
@@ -0,0 +1,437 @@
+"""
+sidewalk_seg_node.py — Semantic sidewalk segmentation node for SaltyBot.
+
+Subscribes:
+ /camera/color/image_raw (sensor_msgs/Image) — RealSense front RGB
+
+Publishes:
+ /segmentation/mask (sensor_msgs/Image, mono8) — traversability class per pixel
+ /segmentation/costmap (nav_msgs/OccupancyGrid) — Nav2 traversability scores
+ /segmentation/debug_image (sensor_msgs/Image, bgr8) — colour-coded visualisation
+
+Model backend (auto-selected, priority order)
+─────────────────────────────────────────────
+ 1. TensorRT FP16 engine (.engine file) — fastest, Orin GPU
+ 2. ONNX Runtime (CUDA provider) — fallback, still GPU
+ 3. ONNX Runtime (CPU provider) — last resort
+
+Build TRT engine:
+ python3 /opt/ros/humble/share/saltybot_segmentation/scripts/build_engine.py
+
+Supported model architectures
+──────────────────────────────
+ BiSeNetV2 — Cityscapes 72.6 mIoU, ~50fps @ 512×256 on Orin
+ DDRNet-23 — Cityscapes 79.5 mIoU, ~40fps @ 512×256 on Orin
+
+Performance target: >15fps at 512×256 on Jetson Orin Nano Super.
+
+Input: 512×256 RGB (letterboxed from 640×480 RealSense color)
+Output: 512×256 per-pixel traversability class ID (uint8)
+"""
+
+import threading
+import time
+
+import cv2
+import numpy as np
+import rclpy
+from cv_bridge import CvBridge
+from nav_msgs.msg import OccupancyGrid, MapMetaData
+from rclpy.node import Node
+from rclpy.qos import QoSProfile, ReliabilityPolicy, HistoryPolicy, DurabilityPolicy
+from sensor_msgs.msg import Image
+from std_msgs.msg import Header
+
+from saltybot_segmentation.seg_utils import (
+ cityscapes_to_traversability,
+ traversability_to_costmap,
+ preprocess_for_inference,
+ unpad_mask,
+ colorise_traversability,
+)
+
+# ── TensorRT backend ──────────────────────────────────────────────────────────
+
+try:
+ import tensorrt as trt
+ import pycuda.driver as cuda
+ import pycuda.autoinit # noqa: F401 — initialises CUDA context
+ _TRT_AVAILABLE = True
+except ImportError:
+ _TRT_AVAILABLE = False
+
+
+class _TRTBackend:
+ """TensorRT FP16 inference backend."""
+
+ def __init__(self, engine_path: str, logger):
+ self._logger = logger
+ trt_logger = trt.Logger(trt.Logger.WARNING)
+ with open(engine_path, "rb") as f:
+ serialized = f.read()
+ runtime = trt.Runtime(trt_logger)
+ self._engine = runtime.deserialize_cuda_engine(serialized)
+ self._context = self._engine.create_execution_context()
+ self._stream = cuda.Stream()
+
+ # Allocate host + device buffers
+ self._bindings = []
+ self._host_in = None
+ self._dev_in = None
+ self._host_out = None
+ self._dev_out = None
+
+ for i in range(self._engine.num_bindings):
+ shape = self._engine.get_binding_shape(i)
+ size = int(np.prod(shape))
+ dtype = trt.nptype(self._engine.get_binding_dtype(i))
+ host_buf = cuda.pagelocked_empty(size, dtype)
+ dev_buf = cuda.mem_alloc(host_buf.nbytes)
+ self._bindings.append(int(dev_buf))
+ if self._engine.binding_is_input(i):
+ self._host_in, self._dev_in = host_buf, dev_buf
+ self._in_shape = shape
+ else:
+ self._host_out, self._dev_out = host_buf, dev_buf
+ self._out_shape = shape
+
+ logger.info(f"TRT engine loaded: in={self._in_shape} out={self._out_shape}")
+
+ def infer(self, blob: np.ndarray) -> np.ndarray:
+ np.copyto(self._host_in, blob.ravel())
+ cuda.memcpy_htod_async(self._dev_in, self._host_in, self._stream)
+ self._context.execute_async_v2(self._bindings, self._stream.handle)
+ cuda.memcpy_dtoh_async(self._host_out, self._dev_out, self._stream)
+ self._stream.synchronize()
+ return self._host_out.reshape(self._out_shape)
+
+
+# ── ONNX Runtime backend ──────────────────────────────────────────────────────
+
+try:
+ import onnxruntime as ort
+ _ONNX_AVAILABLE = True
+except ImportError:
+ _ONNX_AVAILABLE = False
+
+
+class _ONNXBackend:
+ """ONNX Runtime inference backend (CUDA or CPU)."""
+
+ def __init__(self, onnx_path: str, logger):
+ providers = []
+ if _ONNX_AVAILABLE:
+ available = ort.get_available_providers()
+ if "CUDAExecutionProvider" in available:
+ providers.append("CUDAExecutionProvider")
+ logger.info("ONNX Runtime: using CUDA provider")
+ else:
+ logger.warn("ONNX Runtime: CUDA not available, falling back to CPU")
+ providers.append("CPUExecutionProvider")
+
+ self._session = ort.InferenceSession(onnx_path, providers=providers)
+ self._input_name = self._session.get_inputs()[0].name
+ self._output_name = self._session.get_outputs()[0].name
+ logger.info(f"ONNX model loaded: {onnx_path}")
+
+ def infer(self, blob: np.ndarray) -> np.ndarray:
+ return self._session.run([self._output_name], {self._input_name: blob})[0]
+
+
+# ── ROS2 Node ─────────────────────────────────────────────────────────────────
+
+class SidewalkSegNode(Node):
+
+ def __init__(self):
+ super().__init__("sidewalk_seg")
+
+ # ── Parameters ────────────────────────────────────────────────────────
+ self.declare_parameter("engine_path",
+ "/mnt/nvme/saltybot/models/bisenetv2_cityscapes_512x256.engine")
+ self.declare_parameter("onnx_path",
+ "/mnt/nvme/saltybot/models/bisenetv2_cityscapes_512x256.onnx")
+ self.declare_parameter("input_width", 512)
+ self.declare_parameter("input_height", 256)
+ self.declare_parameter("process_every_n", 2) # skip frames to save GPU
+ self.declare_parameter("publish_debug_image", False)
+ self.declare_parameter("unknown_as_obstacle", False)
+ self.declare_parameter("costmap_resolution", 0.05) # metres/cell
+ self.declare_parameter("costmap_range_m", 5.0) # forward projection range
+ self.declare_parameter("camera_height_m", 0.15) # RealSense mount height
+ self.declare_parameter("camera_pitch_deg", 0.0) # tilt angle
+
+ self._p = self._load_params()
+
+ # ── Backend selection (TRT preferred) ──────────────────────────────────
+ self._backend = None
+ self._init_backend()
+
+ # ── Runtime state ─────────────────────────────────────────────────────
+ self._bridge = CvBridge()
+ self._frame_count = 0
+ self._last_mask = None
+ self._last_mask_lock = threading.Lock()
+ self._t_infer = 0.0
+
+ # ── QoS: sensor data (best-effort, keep-last=1) ────────────────────────
+ sensor_qos = QoSProfile(
+ reliability=ReliabilityPolicy.BEST_EFFORT,
+ history=HistoryPolicy.KEEP_LAST,
+ depth=1,
+ )
+ # Transient local for costmap (Nav2 expects this)
+ costmap_qos = QoSProfile(
+ reliability=ReliabilityPolicy.RELIABLE,
+ history=HistoryPolicy.KEEP_LAST,
+ depth=1,
+ durability=DurabilityPolicy.TRANSIENT_LOCAL,
+ )
+
+ # ── Subscriptions ─────────────────────────────────────────────────────
+ self.create_subscription(
+ Image, "/camera/color/image_raw", self._image_cb, sensor_qos)
+
+ # ── Publishers ────────────────────────────────────────────────────────
+ self._mask_pub = self.create_publisher(Image, "/segmentation/mask", 10)
+ self._cost_pub = self.create_publisher(
+ OccupancyGrid, "/segmentation/costmap", costmap_qos)
+ self._debug_pub = self.create_publisher(Image, "/segmentation/debug_image", 1)
+
+ self.get_logger().info(
+ f"SidewalkSeg ready backend={'trt' if isinstance(self._backend, _TRTBackend) else 'onnx'} "
+ f"input={self._p['input_width']}x{self._p['input_height']} "
+ f"process_every={self._p['process_every_n']} frames"
+ )
+
+ # ── Helpers ────────────────────────────────────────────────────────────────
+
+ def _load_params(self) -> dict:
+ return {
+ "engine_path": self.get_parameter("engine_path").value,
+ "onnx_path": self.get_parameter("onnx_path").value,
+ "input_width": self.get_parameter("input_width").value,
+ "input_height": self.get_parameter("input_height").value,
+ "process_every_n": self.get_parameter("process_every_n").value,
+ "publish_debug": self.get_parameter("publish_debug_image").value,
+ "unknown_as_obstacle":self.get_parameter("unknown_as_obstacle").value,
+ "costmap_resolution": self.get_parameter("costmap_resolution").value,
+ "costmap_range_m": self.get_parameter("costmap_range_m").value,
+ "camera_height_m": self.get_parameter("camera_height_m").value,
+ "camera_pitch_deg": self.get_parameter("camera_pitch_deg").value,
+ }
+
+ def _init_backend(self):
+ p = self._p
+ if _TRT_AVAILABLE:
+ import os
+ if os.path.exists(p["engine_path"]):
+ try:
+ self._backend = _TRTBackend(p["engine_path"], self.get_logger())
+ return
+ except Exception as e:
+ self.get_logger().warn(f"TRT load failed: {e} — trying ONNX")
+
+ if _ONNX_AVAILABLE:
+ import os
+ if os.path.exists(p["onnx_path"]):
+ try:
+ self._backend = _ONNXBackend(p["onnx_path"], self.get_logger())
+ return
+ except Exception as e:
+ self.get_logger().warn(f"ONNX load failed: {e}")
+
+ self.get_logger().warn(
+ "No inference backend available — node will publish empty masks. "
+ "Run build_engine.py to create the TRT engine."
+ )
+
+ # ── Image callback ─────────────────────────────────────────────────────────
+
+ def _image_cb(self, msg: Image):
+ self._frame_count += 1
+ if self._frame_count % self._p["process_every_n"] != 0:
+ return
+
+ try:
+ bgr = self._bridge.imgmsg_to_cv2(msg, desired_encoding="bgr8")
+ except Exception as e:
+ self.get_logger().warn(f"cv_bridge decode error: {e}")
+ return
+
+ orig_h, orig_w = bgr.shape[:2]
+ iw = self._p["input_width"]
+ ih = self._p["input_height"]
+
+ # ── Inference ─────────────────────────────────────────────────────────
+ if self._backend is not None:
+ try:
+ t0 = time.monotonic()
+ blob, scale, pad_l, pad_t = preprocess_for_inference(bgr, iw, ih)
+ raw = self._backend.infer(blob)
+ self._t_infer = time.monotonic() - t0
+
+ # raw shape: (1, num_classes, H, W) or (1, H, W)
+ if raw.ndim == 4:
+ class_mask = raw[0].argmax(axis=0).astype(np.uint8)
+ else:
+ class_mask = raw[0].astype(np.uint8)
+
+ # Unpad + restore to original resolution
+ class_mask_full = unpad_mask(
+ class_mask, orig_h, orig_w, scale, pad_l, pad_t)
+
+ trav_mask = cityscapes_to_traversability(class_mask_full)
+
+ except Exception as e:
+ self.get_logger().warn(
+ f"Inference error: {e}", throttle_duration_sec=5.0)
+ trav_mask = np.full((orig_h, orig_w), 4, dtype=np.uint8) # all unknown
+ else:
+ trav_mask = np.full((orig_h, orig_w), 4, dtype=np.uint8) # all unknown
+
+ with self._last_mask_lock:
+ self._last_mask = trav_mask
+
+ stamp = msg.header.stamp
+
+ # ── Publish segmentation mask ──────────────────────────────────────────
+ mask_msg = self._bridge.cv2_to_imgmsg(trav_mask, encoding="mono8")
+ mask_msg.header.stamp = stamp
+ mask_msg.header.frame_id = "camera_color_optical_frame"
+ self._mask_pub.publish(mask_msg)
+
+ # ── Publish costmap ────────────────────────────────────────────────────
+ costmap_msg = self._build_costmap(trav_mask, stamp)
+ self._cost_pub.publish(costmap_msg)
+
+ # ── Debug visualisation ────────────────────────────────────────────────
+ if self._p["publish_debug"]:
+ vis = colorise_traversability(trav_mask)
+ debug_msg = self._bridge.cv2_to_imgmsg(vis, encoding="bgr8")
+ debug_msg.header.stamp = stamp
+ debug_msg.header.frame_id = "camera_color_optical_frame"
+ self._debug_pub.publish(debug_msg)
+
+ if self._frame_count % 30 == 0:
+ fps_str = f"{1.0/self._t_infer:.1f} fps" if self._t_infer > 0 else "no inference"
+ self.get_logger().debug(
+ f"Seg frame {self._frame_count}: {fps_str}",
+ throttle_duration_sec=5.0,
+ )
+
+ # ── Costmap projection ─────────────────────────────────────────────────────
+
+    def _build_costmap(self, trav_mask: np.ndarray, stamp) -> OccupancyGrid:
+        """
+        Project the lower portion of the segmentation mask into a flat
+        OccupancyGrid in the base_link frame.
+
+        The projection uses a simple inverse-perspective ground model:
+          - Only pixels in the lower half of the image are projected
+            (upper half is unlikely to be ground plane in front of robot)
+          - Each pixel row maps to a forward distance using pinhole geometry
+            with the camera mount height and pitch angle.
+          - Columns map to lateral (Y) position via horizontal FOV.
+
+        The resulting OccupancyGrid covers [0, costmap_range_m] forward
+        and [-costmap_range_m/2, costmap_range_m/2] laterally in base_link.
+
+        NOTE(review): nav_msgs/OccupancyGrid data is row-major with
+        index = row * info.width + col, where rows advance along the map
+        frame's +Y axis and cols along +X. Here rows encode forward (X)
+        distance and cols encode lateral (Y) offset, so consumers may see
+        the grid transposed relative to base_link — confirm against Nav2.
+        """
+        p = self._p
+        res = p["costmap_resolution"]          # metres per cell
+        rng = p["costmap_range_m"]             # look-ahead range
+        cam_h = p["camera_height_m"]
+        cam_pit = np.deg2rad(p["camera_pitch_deg"])
+
+        # Costmap grid dimensions (square: rng × rng metres)
+        grid_h = int(rng / res)   # forward cells (X direction)
+        grid_w = int(rng / res)   # lateral cells (Y direction)
+        grid_cx = grid_w // 2     # lateral centre cell
+
+        # Per-pixel int8 cost derived from traversability classes.
+        cost_map_int8 = traversability_to_costmap(
+            trav_mask,
+            unknown_as_obstacle=p["unknown_as_obstacle"],
+        )
+
+        img_h, img_w = trav_mask.shape
+        # Only process lower 60% of image (ground plane region)
+        row_start = int(img_h * 0.40)
+
+        # RealSense D435i approximate intrinsics at 640×480
+        # (horizontal FOV ~87°, vertical FOV ~58°)
+        # NOTE(review): hard-coded FOVs — reading CameraInfo would be safer.
+        fx = img_w / (2.0 * np.tan(np.deg2rad(87.0 / 2)))
+        fy = img_h / (2.0 * np.tan(np.deg2rad(58.0 / 2)))
+        cx = img_w / 2.0
+        cy = img_h / 2.0
+
+        # Output occupancy grid (init to -1 = unknown)
+        grid = np.full((grid_h, grid_w), -1, dtype=np.int8)
+
+        # Pure-Python double loop over the lower image — fine at decimated
+        # rates, but a numpy-vectorised projection would be much faster if
+        # this shows up in profiling.
+        for row in range(row_start, img_h):
+            # Vertical angle from optical axis
+            alpha = np.arctan2(-(row - cy), fy) + cam_pit
+            if alpha >= 0:
+                continue  # ray points up — skip
+            # Ground distance from camera base (forward)
+            fwd_dist = cam_h / np.tan(-alpha)
+            if fwd_dist <= 0 or fwd_dist > rng:
+                continue
+
+            grid_row = int(fwd_dist / res)
+            if grid_row >= grid_h:
+                continue
+
+            for col in range(0, img_w):
+                # Lateral angle
+                beta = np.arctan2(col - cx, fx)
+                lat_dist = fwd_dist * np.tan(beta)
+
+                grid_col = grid_cx + int(lat_dist / res)
+                if grid_col < 0 or grid_col >= grid_w:
+                    continue
+
+                cell_cost = int(cost_map_int8[row, col])
+                existing = int(grid[grid_row, grid_col])
+
+                # Max-cost merge: most conservative estimate wins
+                if existing < 0 or cell_cost > existing:
+                    grid[grid_row, grid_col] = np.int8(cell_cost)
+
+        # Build OccupancyGrid message
+        msg = OccupancyGrid()
+        msg.header.stamp = stamp
+        msg.header.frame_id = "base_link"
+
+        msg.info = MapMetaData()
+        msg.info.resolution = res
+        msg.info.width = grid_w
+        msg.info.height = grid_h
+        msg.info.map_load_time = stamp
+
+        # Origin: lower-left corner in base_link
+        #   Grid row 0 = closest (0m forward), row grid_h-1 = rng forward
+        #   Grid col 0 = leftmost, col grid_cx = straight ahead
+        msg.info.origin.position.x = 0.0
+        msg.info.origin.position.y = -(rng / 2.0)
+        msg.info.origin.position.z = 0.0
+        msg.info.origin.orientation.w = 1.0
+
+        msg.data = grid.flatten().tolist()
+        return msg
+
+
+# ── Entry point ───────────────────────────────────────────────────────────────
+
+def main(args=None):
+ rclpy.init(args=args)
+ node = SidewalkSegNode()
+ try:
+ rclpy.spin(node)
+ except KeyboardInterrupt:
+ pass
+ finally:
+ node.destroy_node()
+ rclpy.try_shutdown()
+
+
+if __name__ == "__main__":
+ main()
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/scripts/build_engine.py b/jetson/ros2_ws/src/saltybot_segmentation/scripts/build_engine.py
new file mode 100644
index 0000000..5055a71
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/scripts/build_engine.py
@@ -0,0 +1,398 @@
+#!/usr/bin/env python3
+"""
+build_engine.py — Convert BiSeNetV2/DDRNet PyTorch model → ONNX → TensorRT FP16 engine.
+
+Run ONCE on the Jetson Orin Nano Super. The .engine file is hardware-specific
+(cannot be transferred between machines).
+
+Usage
+─────
+ # Build BiSeNetV2 engine (default, fastest):
+ python3 build_engine.py
+
+ # Build DDRNet-23-slim engine (higher mIoU, slightly slower):
+ python3 build_engine.py --model ddrnet
+
+ # Custom output paths:
+ python3 build_engine.py --onnx /tmp/model.onnx --engine /tmp/model.engine
+
+ # Re-export ONNX from local weights (skip download):
+ python3 build_engine.py --weights /path/to/bisenetv2.pth
+
+Prerequisites
+─────────────
+ pip install torch torchvision onnx onnxruntime-gpu
+ # TensorRT is pre-installed with JetPack 6 at /usr/lib/python3/dist-packages/tensorrt
+
+Outputs
+───────
+ /mnt/nvme/saltybot/models/bisenetv2_cityscapes_512x256.onnx (FP32)
+ /mnt/nvme/saltybot/models/bisenetv2_cityscapes_512x256.engine (TRT FP16)
+
+Model sources
+─────────────
+ BiSeNetV2 pretrained on Cityscapes:
+ https://github.com/CoinCheung/BiSeNet (MIT License)
+ Checkpoint: cp/model_final_v2_city.pth (~25MB)
+
+ DDRNet-23-slim pretrained on Cityscapes:
+ https://github.com/ydhongHIT/DDRNet (Apache License)
+ Checkpoint: DDRNet23s_imagenet.pth + Cityscapes fine-tune
+
+Performance on Orin Nano Super (1024-core Ampere, 20 TOPS)
+──────────────────────────────────────────────────────────
+ BiSeNetV2 FP32 ONNX: ~12ms (~83fps theoretical)
+ BiSeNetV2 FP16 TRT: ~5ms (~200fps theoretical, real ~50fps w/ overhead)
+ DDRNet-23 FP16 TRT: ~8ms (~125fps theoretical, real ~40fps)
+ Target: >15fps including ROS2 overhead at 512×256
+"""
+
+import argparse
+import os
+import sys
+import time
+
+# ── Default paths ─────────────────────────────────────────────────────────────
+
+DEFAULT_MODEL_DIR = "/mnt/nvme/saltybot/models"
+INPUT_W, INPUT_H = 512, 256
+BATCH_SIZE = 1
+
+MODEL_CONFIGS = {
+ "bisenetv2": {
+ "onnx_name": "bisenetv2_cityscapes_512x256.onnx",
+ "engine_name": "bisenetv2_cityscapes_512x256.engine",
+ "repo_url": "https://github.com/CoinCheung/BiSeNet.git",
+ "weights_url": "https://github.com/CoinCheung/BiSeNet/releases/download/0.0.0/model_final_v2_city.pth",
+ "num_classes": 19,
+ "description": "BiSeNetV2 Cityscapes — 72.6 mIoU, ~50fps on Orin",
+ },
+ "ddrnet": {
+ "onnx_name": "ddrnet23s_cityscapes_512x256.onnx",
+ "engine_name": "ddrnet23s_cityscapes_512x256.engine",
+ "repo_url": "https://github.com/ydhongHIT/DDRNet.git",
+ "weights_url": None, # must supply manually
+ "num_classes": 19,
+ "description": "DDRNet-23-slim Cityscapes — 79.5 mIoU, ~40fps on Orin",
+ },
+}
+
+
+def parse_args():
+ p = argparse.ArgumentParser(description="Build TensorRT segmentation engine")
+ p.add_argument("--model", default="bisenetv2",
+ choices=list(MODEL_CONFIGS.keys()),
+ help="Model architecture")
+ p.add_argument("--weights", default=None,
+ help="Path to .pth weights file (downloads if not set)")
+ p.add_argument("--onnx", default=None, help="Output ONNX path")
+ p.add_argument("--engine", default=None, help="Output TRT engine path")
+ p.add_argument("--fp32", action="store_true",
+ help="Build FP32 engine instead of FP16 (slower, more accurate)")
+ p.add_argument("--workspace-gb", type=float, default=2.0,
+ help="TRT builder workspace in GB (default 2.0)")
+ p.add_argument("--skip-onnx", action="store_true",
+ help="Skip ONNX export (use existing .onnx file)")
+ return p.parse_args()
+
+
+def ensure_dir(path: str):
+ os.makedirs(path, exist_ok=True)
+
+
+def download_weights(url: str, dest: str):
+ """Download model weights with progress display."""
+ import urllib.request
+ print(f" Downloading weights from {url}")
+ print(f" → {dest}")
+
+ def progress(count, block, total):
+ pct = min(count * block / total * 100, 100)
+ bar = "#" * int(pct / 2)
+ sys.stdout.write(f"\r [{bar:<50}] {pct:.1f}%")
+ sys.stdout.flush()
+
+ urllib.request.urlretrieve(url, dest, reporthook=progress)
+ print()
+
+
+def export_bisenetv2_onnx(weights_path: str, onnx_path: str, num_classes: int = 19):
+    """
+    Export BiSeNetV2 from CoinCheung/BiSeNet to ONNX.
+
+    Expects BiSeNet repo to be cloned in /tmp/BiSeNet or PYTHONPATH set.
+
+    Args:
+        weights_path: Cityscapes .pth checkpoint (raw state_dict or wrapped).
+        onnx_path:    Destination .onnx file (fixed batch=1, FP32).
+        num_classes:  Segmentation head size (19 for Cityscapes).
+    """
+    import torch
+
+    # Try to import BiSeNetV2 — clone repo if needed
+    try:
+        sys.path.insert(0, "/tmp/BiSeNet")
+        from lib.models.bisenetv2 import BiSeNetV2
+    except ImportError:
+        # NOTE(review): os.system exit status is unchecked; a failed clone
+        # surfaces as the re-raised ImportError on the import below.
+        print(" Cloning BiSeNet repository to /tmp/BiSeNet ...")
+        os.system("git clone --depth 1 https://github.com/CoinCheung/BiSeNet.git /tmp/BiSeNet")
+        sys.path.insert(0, "/tmp/BiSeNet")
+        from lib.models.bisenetv2 import BiSeNetV2
+
+    print(" Loading BiSeNetV2 weights ...")
+    net = BiSeNetV2(num_classes)
+    state = torch.load(weights_path, map_location="cpu")
+    # Handle both direct state_dict and checkpoint wrapper
+    state_dict = state.get("state_dict", state.get("model", state))
+    # Strip module. prefix from DataParallel checkpoints
+    state_dict = {k.replace("module.", ""): v for k, v in state_dict.items()}
+    # strict=False tolerates aux-head keys absent from the checkpoint,
+    # but it also silences genuine mismatches — verify model outputs.
+    net.load_state_dict(state_dict, strict=False)
+    net.eval()
+
+    print(f" Exporting ONNX → {onnx_path}")
+    dummy = torch.randn(BATCH_SIZE, 3, INPUT_H, INPUT_W)
+
+    import torch.onnx
+    # BiSeNetV2 inference returns (logits, *aux) — we only want logits
+    class _Wrapper(torch.nn.Module):
+        def __init__(self, net):
+            super().__init__()
+            self.net = net
+        def forward(self, x):
+            out = self.net(x)
+            return out[0] if isinstance(out, (list, tuple)) else out
+
+    wrapped = _Wrapper(net)
+    torch.onnx.export(
+        wrapped, dummy, onnx_path,
+        opset_version=12,
+        input_names=["image"],
+        output_names=["logits"],
+        dynamic_axes=None,  # fixed batch=1 for TRT
+        do_constant_folding=True,
+    )
+
+    # Verify the exported graph is structurally valid.
+    import onnx
+    model = onnx.load(onnx_path)
+    onnx.checker.check_model(model)
+    print(f" ONNX export verified ({os.path.getsize(onnx_path) / 1e6:.1f} MB)")
+
+
+def export_ddrnet_onnx(weights_path: str, onnx_path: str, num_classes: int = 19):
+    """Export DDRNet-23-slim to ONNX (fixed batch=1, FP32).
+
+    Clones ydhongHIT/DDRNet into /tmp/DDRNet when the model module is not
+    already importable.
+    """
+    import torch
+
+    try:
+        # NOTE(review): this path ("/tmp/DDRNet/tools/../lib") differs from
+        # the one inserted after cloning ("/tmp/DDRNet/lib"); both resolve
+        # to the same directory, but the asymmetry looks accidental.
+        sys.path.insert(0, "/tmp/DDRNet/tools/../lib")
+        from models.ddrnet_23_slim import get_seg_model
+    except ImportError:
+        # NOTE(review): os.system exit status is unchecked — a failed clone
+        # shows up as a second ImportError below.
+        print(" Cloning DDRNet repository to /tmp/DDRNet ...")
+        os.system("git clone --depth 1 https://github.com/ydhongHIT/DDRNet.git /tmp/DDRNet")
+        sys.path.insert(0, "/tmp/DDRNet/lib")
+        from models.ddrnet_23_slim import get_seg_model
+
+    print(" Loading DDRNet weights ...")
+    net = get_seg_model(num_classes=num_classes)
+    # Strip DataParallel "module." prefixes; strict=False tolerates keys
+    # missing from the checkpoint (silences mismatches — verify outputs).
+    net.load_state_dict(
+        {k.replace("module.", ""): v
+         for k, v in torch.load(weights_path, map_location="cpu").items()},
+        strict=False
+    )
+    net.eval()
+
+    print(f" Exporting ONNX → {onnx_path}")
+    dummy = torch.randn(BATCH_SIZE, 3, INPUT_H, INPUT_W)
+    import torch.onnx
+    torch.onnx.export(
+        net, dummy, onnx_path,
+        opset_version=12,
+        input_names=["image"],
+        output_names=["logits"],
+        do_constant_folding=True,
+    )
+    # Structural check of the exported graph.
+    import onnx
+    onnx.checker.check_model(onnx.load(onnx_path))
+    print(f" ONNX export verified ({os.path.getsize(onnx_path) / 1e6:.1f} MB)")
+
+
+def build_trt_engine(onnx_path: str, engine_path: str,
+                     fp16: bool = True, workspace_gb: float = 2.0):
+    """
+    Build a TensorRT engine from an ONNX model.
+
+    Uses explicit batch dimension (not implicit batch).
+    Enables FP16 mode by default (2× speedup on Orin Ampere vs FP32).
+
+    Args:
+        onnx_path:    Source ONNX file (fixed batch=1 expected).
+        engine_path:  Destination serialized .engine file.
+        fp16:         Request FP16 kernels if the platform supports them.
+        workspace_gb: Builder scratch-memory limit in gigabytes.
+
+    Exits the process on missing TensorRT, parse failure, or build failure.
+    """
+    try:
+        import tensorrt as trt
+    except ImportError:
+        print("ERROR: TensorRT not found. Install JetPack 6 or:")
+        print(" pip install tensorrt (x86 only)")
+        sys.exit(1)
+
+    logger = trt.Logger(trt.Logger.INFO)
+
+    print(f"\n Building TRT engine ({'FP16' if fp16 else 'FP32'}) from: {onnx_path}")
+    print(f" Output: {engine_path}")
+    print(f" Workspace: {workspace_gb:.1f} GB")
+    print(" This may take 5–15 minutes on first build (layer calibration)...")
+
+    t0 = time.time()
+
+    builder = trt.Builder(logger)
+    # NOTE(review): EXPLICIT_BATCH is the default (and deprecated) flag on
+    # recent TensorRT releases — harmless here, but may log a warning.
+    network = builder.create_network(
+        1 << int(trt.NetworkDefinitionCreationFlag.EXPLICIT_BATCH)
+    )
+    parser = trt.OnnxParser(network, logger)
+    config = builder.create_builder_config()
+
+    # Workspace (TRT >= 8.4 memory-pool API)
+    config.set_memory_pool_limit(
+        trt.MemoryPoolType.WORKSPACE, int(workspace_gb * 1024**3)
+    )
+
+    # FP16 precision
+    if fp16 and builder.platform_has_fast_fp16:
+        config.set_flag(trt.BuilderFlag.FP16)
+        print(" FP16 mode enabled")
+    elif fp16:
+        print(" WARNING: FP16 not available on this platform, using FP32")
+
+    # Parse ONNX
+    with open(onnx_path, "rb") as f:
+        if not parser.parse(f.read()):
+            for i in range(parser.num_errors):
+                print(f" ONNX parse error: {parser.get_error(i)}")
+            sys.exit(1)
+
+    print(f" Network: {network.num_inputs} input(s), {network.num_outputs} output(s)")
+    inp = network.get_input(0)
+    print(f" Input shape: {inp.shape} dtype: {inp.dtype}")
+
+    # Build — the slow step; kernel auto-tuning happens here.
+    serialized_engine = builder.build_serialized_network(network, config)
+    if serialized_engine is None:
+        print("ERROR: TRT engine build failed")
+        sys.exit(1)
+
+    with open(engine_path, "wb") as f:
+        f.write(serialized_engine)
+
+    elapsed = time.time() - t0
+    size_mb = os.path.getsize(engine_path) / 1e6
+    print(f"\n Engine built in {elapsed:.1f}s ({size_mb:.1f} MB)")
+    print(f" Saved: {engine_path}")
+
+
+def validate_engine(engine_path: str):
+    """Run a dummy inference to confirm the engine works and measure latency.
+
+    Deserialises the engine, allocates page-locked host + device buffers,
+    warms up, then reports the mean latency over 20 runs against the
+    project's >15fps target. Silently skipped when pycuda is missing.
+
+    NOTE(review): this uses the TensorRT 8.x binding API (num_bindings,
+    get_binding_shape, execute_async_v2), which was removed in TRT 10 —
+    confirm the installed JetPack/TensorRT version.
+    """
+    try:
+        import tensorrt as trt
+        import pycuda.driver as cuda
+        import pycuda.autoinit  # noqa
+        import numpy as np
+    except ImportError:
+        print(" Skipping validation (pycuda not available)")
+        return
+
+    print("\n Validating engine with dummy input...")
+    trt_logger = trt.Logger(trt.Logger.WARNING)
+    with open(engine_path, "rb") as f:
+        engine = trt.Runtime(trt_logger).deserialize_cuda_engine(f.read())
+    ctx = engine.create_execution_context()
+    stream = cuda.Stream()
+
+    bindings = []
+    host_in = host_out = dev_in = dev_out = None
+    for i in range(engine.num_bindings):
+        shape = engine.get_binding_shape(i)
+        dtype = trt.nptype(engine.get_binding_dtype(i))
+        # Page-locked host memory enables truly async H2D/D2H copies.
+        h_buf = cuda.pagelocked_empty(int(np.prod(shape)), dtype)
+        d_buf = cuda.mem_alloc(h_buf.nbytes)
+        bindings.append(int(d_buf))
+        if engine.binding_is_input(i):
+            host_in, dev_in = h_buf, d_buf
+            host_in[:] = np.random.randn(*shape).astype(dtype).ravel()
+        else:
+            host_out, dev_out = h_buf, d_buf
+
+    # Warm up — first runs include lazy CUDA init / kernel loading.
+    for _ in range(5):
+        cuda.memcpy_htod_async(dev_in, host_in, stream)
+        ctx.execute_async_v2(bindings, stream.handle)
+        cuda.memcpy_dtoh_async(host_out, dev_out, stream)
+        stream.synchronize()
+
+    # Benchmark
+    N = 20
+    t0 = time.time()
+    for _ in range(N):
+        cuda.memcpy_htod_async(dev_in, host_in, stream)
+        ctx.execute_async_v2(bindings, stream.handle)
+        cuda.memcpy_dtoh_async(host_out, dev_out, stream)
+        stream.synchronize()
+    elapsed_ms = (time.time() - t0) * 1000 / N
+
+    # Assumes the last binding is the output — holds for single-output nets.
+    out_shape = engine.get_binding_shape(engine.num_bindings - 1)
+    print(f" Output shape: {out_shape}")
+    print(f" Inference latency: {elapsed_ms:.1f}ms ({1000/elapsed_ms:.1f} fps) [avg {N} runs]")
+    if elapsed_ms < 1000 / 15:
+        print(" PASS: target >15fps achieved")
+    else:
+        print(f" WARNING: latency {elapsed_ms:.1f}ms > target {1000/15:.1f}ms")
+
+
+def main():
+ args = parse_args()
+ cfg = MODEL_CONFIGS[args.model]
+ print(f"\nBuilding TRT engine for: {cfg['description']}")
+
+ ensure_dir(DEFAULT_MODEL_DIR)
+
+ onnx_path = args.onnx or os.path.join(DEFAULT_MODEL_DIR, cfg["onnx_name"])
+ engine_path = args.engine or os.path.join(DEFAULT_MODEL_DIR, cfg["engine_name"])
+
+ # ── Step 1: Download weights if needed ────────────────────────────────────
+ if not args.skip_onnx:
+ weights_path = args.weights
+ if weights_path is None:
+ if cfg["weights_url"] is None:
+ print(f"ERROR: No weights URL for {args.model}. Supply --weights /path/to.pth")
+ sys.exit(1)
+ weights_path = os.path.join(DEFAULT_MODEL_DIR, f"{args.model}_cityscapes.pth")
+ if not os.path.exists(weights_path):
+ print("\nStep 1: Downloading pretrained weights")
+ download_weights(cfg["weights_url"], weights_path)
+ else:
+ print(f"\nStep 1: Using cached weights: {weights_path}")
+ else:
+ print(f"\nStep 1: Using provided weights: {weights_path}")
+
+ # ── Step 2: Export ONNX ────────────────────────────────────────────────
+ print(f"\nStep 2: Exporting {args.model.upper()} to ONNX ({INPUT_W}×{INPUT_H})")
+ if args.model == "bisenetv2":
+ export_bisenetv2_onnx(weights_path, onnx_path, cfg["num_classes"])
+ else:
+ export_ddrnet_onnx(weights_path, onnx_path, cfg["num_classes"])
+ else:
+ print(f"\nStep 1+2: Skipping ONNX export, using: {onnx_path}")
+ if not os.path.exists(onnx_path):
+ print(f"ERROR: ONNX file not found: {onnx_path}")
+ sys.exit(1)
+
+ # ── Step 3: Build TRT engine ───────────────────────────────────────────────
+ print(f"\nStep 3: Building TensorRT engine")
+ build_trt_engine(
+ onnx_path, engine_path,
+ fp16=not args.fp32,
+ workspace_gb=args.workspace_gb,
+ )
+
+ # ── Step 4: Validate ───────────────────────────────────────────────────────
+ print(f"\nStep 4: Validating engine")
+ validate_engine(engine_path)
+
+ print(f"\nDone. Engine: {engine_path}")
+ print("Start the node:")
+ print(f" ros2 launch saltybot_segmentation sidewalk_segmentation.launch.py \\")
+ print(f" engine_path:={engine_path}")
+
+
+if __name__ == "__main__":
+ main()
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/scripts/fine_tune.py b/jetson/ros2_ws/src/saltybot_segmentation/scripts/fine_tune.py
new file mode 100644
index 0000000..5e9fb46
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/scripts/fine_tune.py
@@ -0,0 +1,400 @@
+#!/usr/bin/env python3
+"""
+fine_tune.py — Fine-tune BiSeNetV2 on custom sidewalk data.
+
+Walk-and-label workflow:
+ 1. Record a ROS2 bag while walking the route:
+ ros2 bag record /camera/color/image_raw -o sidewalk_route
+ 2. Extract frames from the bag:
+ python3 fine_tune.py --extract-frames sidewalk_route/ --output-dir data/raw/ --every-n 5
+ 3. Label 50+ frames in LabelMe (or CVAT):
+ labelme data/raw/ (save as JSON)
+ 4. Convert labels to Cityscapes-format masks:
+ python3 fine_tune.py --convert-labels data/raw/ --output-dir data/labels/
+ 5. Fine-tune:
+ python3 fine_tune.py --train --images data/raw/ --labels data/labels/ \
+ --weights /mnt/nvme/saltybot/models/bisenetv2_cityscapes.pth \
+ --output /mnt/nvme/saltybot/models/bisenetv2_custom.pth
+ 6. Build new TRT engine:
+ python3 build_engine.py --weights /mnt/nvme/saltybot/models/bisenetv2_custom.pth
+
+LabelMe class names (must match exactly in labelme JSON):
+ sidewalk → Cityscapes ID 1 → TRAV_SIDEWALK
+ road → Cityscapes ID 0 → TRAV_ROAD
+ grass → Cityscapes ID 8 → TRAV_GRASS (use 'vegetation')
+ obstacle → Cityscapes ID 2 → TRAV_OBSTACLE (use 'building' for static)
+ person → Cityscapes ID 11
+ car → Cityscapes ID 13
+
+Requirements:
+ pip install torch torchvision albumentations labelme opencv-python
+"""
+
+import argparse
+import json
+import os
+import sys
+
+import numpy as np
+
+# ── Label → Cityscapes ID mapping for custom annotation ──────────────────────
+
+LABEL_TO_CITYSCAPES = {
+ "road": 0,
+ "sidewalk": 1,
+ "building": 2,
+ "wall": 3,
+ "fence": 4,
+ "pole": 5,
+ "traffic light": 6,
+ "traffic sign": 7,
+ "vegetation": 8,
+ "grass": 8, # alias
+ "terrain": 9,
+ "sky": 10,
+ "person": 11,
+ "rider": 12,
+ "car": 13,
+ "truck": 14,
+ "bus": 15,
+ "train": 16,
+ "motorcycle": 17,
+ "bicycle": 18,
+ # saltybot-specific aliases
+ "kerb": 1, # map kerb → sidewalk
+ "pavement": 1, # British English
+ "path": 1,
+ "tarmac": 0, # map tarmac → road
+ "shrub": 8, # map shrub → vegetation
+}
+
+DEFAULT_CLASS = 255 # unlabelled pixels → ignore in loss
+
+
+def parse_args():
+ p = argparse.ArgumentParser(description="Fine-tune BiSeNetV2 on custom data")
+ p.add_argument("--extract-frames", metavar="BAG_DIR",
+ help="Extract frames from a ROS2 bag")
+ p.add_argument("--output-dir", default="data/raw",
+ help="Output directory for extracted frames or converted labels")
+ p.add_argument("--every-n", type=int, default=5,
+ help="Extract every N-th frame from bag")
+ p.add_argument("--convert-labels", metavar="LABELME_DIR",
+ help="Convert LabelMe JSON annotations to Cityscapes masks")
+ p.add_argument("--train", action="store_true",
+ help="Run fine-tuning loop")
+ p.add_argument("--images", default="data/raw",
+ help="Directory of training images")
+ p.add_argument("--labels", default="data/labels",
+ help="Directory of label masks (PNG, Cityscapes IDs)")
+ p.add_argument("--weights", required=False,
+ default="/mnt/nvme/saltybot/models/bisenetv2_cityscapes.pth",
+ help="Path to pretrained BiSeNetV2 weights")
+ p.add_argument("--output",
+ default="/mnt/nvme/saltybot/models/bisenetv2_custom.pth",
+ help="Output path for fine-tuned weights")
+ p.add_argument("--epochs", type=int, default=20)
+ p.add_argument("--lr", type=float, default=1e-4)
+ p.add_argument("--batch-size", type=int, default=4)
+ p.add_argument("--input-size", nargs=2, type=int, default=[512, 256],
+ help="Model input size: W H")
+ p.add_argument("--eval", action="store_true",
+ help="Evaluate mIoU on labelled data instead of training")
+ return p.parse_args()
+
+
+# ── Frame extraction from ROS2 bag ────────────────────────────────────────────
+
+def extract_frames(bag_dir: str, output_dir: str, every_n: int = 5):
+    """Extract /camera/color/image_raw frames from a ROS2 bag.
+
+    Saves every ``every_n``-th colour frame as a JPEG named after the
+    message's bag timestamp. Must run inside a sourced ROS2 environment.
+
+    Args:
+        bag_dir:    Path to the bag directory (sqlite3 storage assumed).
+        output_dir: Destination for extracted .jpg frames (created).
+        every_n:    Keep 1 in N messages to thin the dataset.
+    """
+    try:
+        import rclpy
+        from rosbag2_py import SequentialReader, StorageOptions, ConverterOptions
+        from rclpy.serialization import deserialize_message
+        from sensor_msgs.msg import Image
+        from cv_bridge import CvBridge
+        import cv2
+    except ImportError:
+        print("ERROR: rosbag2_py / rclpy not available. Must run in ROS2 environment.")
+        sys.exit(1)
+
+    os.makedirs(output_dir, exist_ok=True)
+    bridge = CvBridge()
+
+    reader = SequentialReader()
+    # NOTE(review): storage_id is hard-coded to "sqlite3"; bags recorded on
+    # newer distros may use "mcap" — confirm the recording format.
+    reader.open(
+        StorageOptions(uri=bag_dir, storage_id="sqlite3"),
+        ConverterOptions("", ""),
+    )
+
+    topic = "/camera/color/image_raw"
+    count = 0   # messages seen on the target topic
+    saved = 0   # frames written to disk
+
+    while reader.has_next():
+        topic_name, data, ts = reader.read_next()
+        if topic_name != topic:
+            continue
+        count += 1
+        if count % every_n != 0:
+            continue
+
+        msg = deserialize_message(data, Image)
+        bgr = bridge.imgmsg_to_cv2(msg, "bgr8")
+        # Zero-padded timestamp keeps filenames sortable in time order.
+        fname = os.path.join(output_dir, f"frame_{ts:020d}.jpg")
+        cv2.imwrite(fname, bgr, [cv2.IMWRITE_JPEG_QUALITY, 95])
+        saved += 1
+        if saved % 10 == 0:
+            print(f" Saved {saved} frames...")
+
+    print(f"Extracted {saved} frames from {count} total to {output_dir}")
+
+
+# ── LabelMe JSON → Cityscapes mask ───────────────────────────────────────────
+
+def convert_labelme_to_masks(labelme_dir: str, output_dir: str):
+ """Convert LabelMe polygon annotations to per-pixel Cityscapes-ID PNG masks."""
+ try:
+ import cv2
+ except ImportError:
+ print("ERROR: opencv-python not installed. pip install opencv-python")
+ sys.exit(1)
+
+ os.makedirs(output_dir, exist_ok=True)
+ json_files = [f for f in os.listdir(labelme_dir) if f.endswith(".json")]
+
+ if not json_files:
+ print(f"No .json annotation files found in {labelme_dir}")
+ sys.exit(1)
+
+ print(f"Converting {len(json_files)} annotation files...")
+ for jf in json_files:
+ with open(os.path.join(labelme_dir, jf)) as f:
+ anno = json.load(f)
+
+ h = anno["imageHeight"]
+ w = anno["imageWidth"]
+ mask = np.full((h, w), DEFAULT_CLASS, dtype=np.uint8)
+
+ for shape in anno.get("shapes", []):
+ label = shape["label"].lower().strip()
+ cid = LABEL_TO_CITYSCAPES.get(label)
+ if cid is None:
+ print(f" WARNING: unknown label '{label}' in {jf} — skipping")
+ continue
+
+ pts = np.array(shape["points"], dtype=np.int32)
+ cv2.fillPoly(mask, [pts], cid)
+
+ out_name = os.path.splitext(jf)[0] + "_mask.png"
+ cv2.imwrite(os.path.join(output_dir, out_name), mask)
+
+ print(f"Masks saved to {output_dir}")
+
+
+# ── Training loop ─────────────────────────────────────────────────────────────
+
+def train(args):
+    """Fine-tune BiSeNetV2 with cross-entropy loss + ignore_index=255.
+
+    Loads the Cityscapes-pretrained checkpoint, trains on the custom
+    image/mask pairs, and saves the weights with the lowest *training*
+    loss to ``args.output``.
+
+    NOTE(review): image/label pairs are matched by sorted filename order
+    and there is no validation split — "best" means best training loss.
+    """
+    try:
+        import torch
+        import torch.nn as nn
+        import torch.optim as optim
+        from torch.utils.data import Dataset, DataLoader
+        import cv2
+        import albumentations as A
+        from albumentations.pytorch import ToTensorV2
+    except ImportError as e:
+        print(f"ERROR: missing dependency — {e}")
+        print("pip install torch torchvision albumentations opencv-python")
+        sys.exit(1)
+
+    # -- Dataset ---------------------------------------------------------------
+    class SegDataset(Dataset):
+        # Pairs images with masks by sorted filename order.
+        def __init__(self, img_dir, lbl_dir, transform=None):
+            self.imgs = sorted([
+                os.path.join(img_dir, f)
+                for f in os.listdir(img_dir)
+                if f.endswith((".jpg", ".png"))
+            ])
+            self.lbls = sorted([
+                os.path.join(lbl_dir, f)
+                for f in os.listdir(lbl_dir)
+                if f.endswith(".png")
+            ])
+            if len(self.imgs) != len(self.lbls):
+                raise ValueError(
+                    f"Image/label count mismatch: {len(self.imgs)} vs {len(self.lbls)}"
+                )
+            self.transform = transform
+
+        def __len__(self): return len(self.imgs)
+
+        def __getitem__(self, idx):
+            img = cv2.cvtColor(cv2.imread(self.imgs[idx]), cv2.COLOR_BGR2RGB)
+            lbl = cv2.imread(self.lbls[idx], cv2.IMREAD_GRAYSCALE)
+            if self.transform:
+                # Albumentations applies identical geometry to image & mask.
+                aug = self.transform(image=img, mask=lbl)
+                img, lbl = aug["image"], aug["mask"]
+            return img, lbl.long()
+
+    iw, ih = args.input_size
+    transform = A.Compose([
+        A.Resize(ih, iw),
+        A.HorizontalFlip(p=0.5),
+        A.ColorJitter(brightness=0.3, contrast=0.3, saturation=0.3, hue=0.1, p=0.5),
+        # ImageNet statistics — matches the pretrained backbone.
+        A.Normalize(mean=(0.485, 0.456, 0.406), std=(0.229, 0.224, 0.225)),
+        ToTensorV2(),
+    ])
+
+    dataset = SegDataset(args.images, args.labels, transform=transform)
+    loader = DataLoader(dataset, batch_size=args.batch_size, shuffle=True,
+                        num_workers=2, pin_memory=True)
+    print(f"Dataset: {len(dataset)} samples batch={args.batch_size}")
+
+    # -- Model -----------------------------------------------------------------
+    sys.path.insert(0, "/tmp/BiSeNet")
+    try:
+        from lib.models.bisenetv2 import BiSeNetV2
+    except ImportError:
+        # NOTE(review): os.system return code is unchecked — a failed clone
+        # surfaces as the ImportError on the next line.
+        os.system("git clone --depth 1 https://github.com/CoinCheung/BiSeNet.git /tmp/BiSeNet")
+        from lib.models.bisenetv2 import BiSeNetV2
+
+    net = BiSeNetV2(n_classes=19)
+    state = torch.load(args.weights, map_location="cpu")
+    # Accept raw state_dicts as well as {"state_dict": ...}/{"model": ...}
+    state_dict = state.get("state_dict", state.get("model", state))
+    state_dict = {k.replace("module.", ""): v for k, v in state_dict.items()}
+    # strict=False silences key mismatches — verify outputs after loading.
+    net.load_state_dict(state_dict, strict=False)
+
+    device = "cuda" if torch.cuda.is_available() else "cpu"
+    net = net.to(device)
+    print(f"Training on: {device}")
+
+    # -- Optimiser (low LR to preserve Cityscapes knowledge) -------------------
+    optimiser = optim.AdamW(net.parameters(), lr=args.lr, weight_decay=1e-4)
+    scheduler = optim.lr_scheduler.CosineAnnealingLR(optimiser, T_max=args.epochs)
+    # ignore_index skips unlabelled (255) pixels in the loss.
+    criterion = nn.CrossEntropyLoss(ignore_index=DEFAULT_CLASS)
+
+    # -- Loop ------------------------------------------------------------------
+    best_loss = float("inf")
+    for epoch in range(1, args.epochs + 1):
+        net.train()
+        total_loss = 0.0
+
+        for imgs, lbls in loader:
+            imgs = imgs.to(device, dtype=torch.float32)
+            lbls = lbls.to(device)
+
+            out = net(imgs)
+            # Model may return (main_logits, *aux) — keep only the main head.
+            logits = out[0] if isinstance(out, (list, tuple)) else out
+
+            loss = criterion(logits, lbls)
+            optimiser.zero_grad()
+            loss.backward()
+            optimiser.step()
+            total_loss += loss.item()
+
+        scheduler.step()
+        avg = total_loss / len(loader)
+        print(f" Epoch {epoch:3d}/{args.epochs} loss={avg:.4f} lr={scheduler.get_last_lr()[0]:.2e}")
+
+        # Checkpoint on best *training* loss (no validation split).
+        if avg < best_loss:
+            best_loss = avg
+            torch.save(net.state_dict(), args.output)
+            print(f" Saved best model → {args.output}")
+
+    print(f"\nFine-tuning done. Best loss: {best_loss:.4f} Saved: {args.output}")
+    print("\nNext step: rebuild TRT engine:")
+    print(f" python3 build_engine.py --weights {args.output}")
+
+
+# ── mIoU evaluation ───────────────────────────────────────────────────────────
+
+def evaluate_miou(args):
+ """Compute mIoU on labelled validation data."""
+ try:
+ import torch
+ import cv2
+ except ImportError:
+ print("ERROR: torch/cv2 not available")
+ sys.exit(1)
+
+ from saltybot_segmentation.seg_utils import cityscapes_to_traversability
+
+ NUM_CLASSES = 19
+ confusion = np.zeros((NUM_CLASSES, NUM_CLASSES), dtype=np.int64)
+
+ sys.path.insert(0, "/tmp/BiSeNet")
+ from lib.models.bisenetv2 import BiSeNetV2
+ import torch
+
+ net = BiSeNetV2(n_classes=NUM_CLASSES)
+ state_dict = {k.replace("module.", ""): v
+ for k, v in torch.load(args.weights, map_location="cpu").items()}
+ net.load_state_dict(state_dict, strict=False)
+ net.eval().cuda() if torch.cuda.is_available() else net.eval()
+ device = next(net.parameters()).device
+
+ iw, ih = args.input_size
+ img_files = sorted([f for f in os.listdir(args.images) if f.endswith((".jpg", ".png"))])
+ lbl_files = sorted([f for f in os.listdir(args.labels) if f.endswith(".png")])
+
+ from saltybot_segmentation.seg_utils import preprocess_for_inference, unpad_mask
+
+ with torch.no_grad():
+ for imgf, lblf in zip(img_files, lbl_files):
+ img = cv2.imread(os.path.join(args.images, imgf))
+ lbl = cv2.imread(os.path.join(args.labels, lblf), cv2.IMREAD_GRAYSCALE)
+ H, W = img.shape[:2]
+
+ blob, scale, pad_l, pad_t = preprocess_for_inference(img, iw, ih)
+ t_blob = torch.from_numpy(blob).to(device)
+ out = net(t_blob)
+ logits = out[0] if isinstance(out, (list, tuple)) else out
+ pred = logits[0].argmax(0).cpu().numpy().astype(np.uint8)
+ pred = unpad_mask(pred, H, W, scale, pad_l, pad_t)
+
+ valid = lbl != DEFAULT_CLASS
+ np.add.at(confusion, (lbl[valid].ravel(), pred[valid].ravel()), 1)
+
+ # Per-class IoU
+ iou_per_class = []
+ for c in range(NUM_CLASSES):
+ tp = confusion[c, c]
+ fp = confusion[:, c].sum() - tp
+ fn = confusion[c, :].sum() - tp
+ denom = tp + fp + fn
+ iou_per_class.append(tp / denom if denom > 0 else float("nan"))
+
+ valid_iou = [v for v in iou_per_class if not np.isnan(v)]
+ miou = np.mean(valid_iou)
+
+ CITYSCAPES_NAMES = ["road", "sidewalk", "building", "wall", "fence", "pole",
+ "traffic light", "traffic sign", "vegetation", "terrain",
+ "sky", "person", "rider", "car", "truck", "bus", "train",
+ "motorcycle", "bicycle"]
+ print("\nmIoU per class:")
+ for i, (name, iou) in enumerate(zip(CITYSCAPES_NAMES, iou_per_class)):
+ marker = " *" if not np.isnan(iou) else ""
+ print(f" {i:2d} {name:<16} {iou*100:5.1f}%{marker}")
+ print(f"\nmIoU: {miou*100:.2f}% ({len(valid_iou)}/{NUM_CLASSES} classes present)")
+
+
+def main():
+ args = parse_args()
+
+ if args.extract_frames:
+ extract_frames(args.extract_frames, args.output_dir, args.every_n)
+ elif args.convert_labels:
+ convert_labelme_to_masks(args.convert_labels, args.output_dir)
+ elif args.eval:
+ evaluate_miou(args)
+ elif args.train:
+ train(args)
+ else:
+ print("Specify one of: --extract-frames, --convert-labels, --train, --eval")
+ sys.exit(1)
+
+
+if __name__ == "__main__":
+ main()
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/setup.cfg b/jetson/ros2_ws/src/saltybot_segmentation/setup.cfg
new file mode 100644
index 0000000..91415cc
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/setup.cfg
@@ -0,0 +1,4 @@
+[develop]
+script_dir=$base/lib/saltybot_segmentation
+[install]
+install_scripts=$base/lib/saltybot_segmentation
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/setup.py b/jetson/ros2_ws/src/saltybot_segmentation/setup.py
new file mode 100644
index 0000000..720b088
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/setup.py
@@ -0,0 +1,36 @@
from setuptools import setup
import os
from glob import glob

package_name = "saltybot_segmentation"

# ament_python package manifest: installs the Python package plus launch,
# config, helper scripts and docs into the ROS 2 share directory.
setup(
    name=package_name,
    version="0.1.0",
    packages=[package_name],
    data_files=[
        # Marker file so the ament resource index can locate this package.
        ("share/ament_index/resource_index/packages",
         ["resource/" + package_name]),
        ("share/" + package_name, ["package.xml"]),
        (os.path.join("share", package_name, "launch"),
         glob("launch/*.py")),
        (os.path.join("share", package_name, "config"),
         glob("config/*.yaml")),
        (os.path.join("share", package_name, "scripts"),
         glob("scripts/*.py")),
        (os.path.join("share", package_name, "docs"),
         glob("docs/*.md")),
    ],
    install_requires=["setuptools"],
    zip_safe=True,
    maintainer="seb",
    maintainer_email="seb@vayrette.com",
    description="Semantic sidewalk segmentation for SaltyBot (BiSeNetV2/DDRNet TensorRT)",
    license="MIT",
    tests_require=["pytest"],
    entry_points={
        "console_scripts": [
            # ros2 run saltybot_segmentation sidewalk_seg
            "sidewalk_seg = saltybot_segmentation.sidewalk_seg_node:main",
        ],
    },
)
diff --git a/jetson/ros2_ws/src/saltybot_segmentation/test/test_seg_utils.py b/jetson/ros2_ws/src/saltybot_segmentation/test/test_seg_utils.py
new file mode 100644
index 0000000..3a78cf1
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation/test/test_seg_utils.py
@@ -0,0 +1,168 @@
+"""
+test_seg_utils.py — Unit tests for seg_utils pure helpers.
+
+No ROS2 / TensorRT / cv2 runtime required — plain pytest with numpy.
+"""
+
+import numpy as np
+import pytest
+
+from saltybot_segmentation.seg_utils import (
+ TRAV_SIDEWALK, TRAV_GRASS, TRAV_ROAD, TRAV_OBSTACLE, TRAV_UNKNOWN,
+ TRAV_TO_COST,
+ cityscapes_to_traversability,
+ traversability_to_costmap,
+)
+
+
+# ── cityscapes_to_traversability ──────────────────────────────────────────────
+
class TestCityscapesToTraversability:
    """cityscapes_to_traversability: Cityscapes trainIds -> traversability.

    Cityscapes trainIds referenced below: road=0, sidewalk=1, building=2,
    wall=3, fence=4, pole=5, traffic light=6, traffic sign=7, vegetation=8,
    terrain=9, sky=10, person=11, rider=12, car=13, truck=14, bus=15,
    train=16, motorcycle=17, bicycle=18.
    """

    def test_sidewalk_maps_to_free(self):
        mask = np.array([[1]], dtype=np.uint8)  # Cityscapes: sidewalk
        result = cityscapes_to_traversability(mask)
        assert result[0, 0] == TRAV_SIDEWALK

    def test_road_maps_to_road(self):
        mask = np.array([[0]], dtype=np.uint8)  # Cityscapes: road
        result = cityscapes_to_traversability(mask)
        assert result[0, 0] == TRAV_ROAD

    def test_vegetation_maps_to_grass(self):
        mask = np.array([[8]], dtype=np.uint8)  # Cityscapes: vegetation
        result = cityscapes_to_traversability(mask)
        assert result[0, 0] == TRAV_GRASS

    def test_terrain_maps_to_grass(self):
        mask = np.array([[9]], dtype=np.uint8)  # Cityscapes: terrain
        result = cityscapes_to_traversability(mask)
        assert result[0, 0] == TRAV_GRASS

    def test_building_maps_to_obstacle(self):
        mask = np.array([[2]], dtype=np.uint8)  # Cityscapes: building
        result = cityscapes_to_traversability(mask)
        assert result[0, 0] == TRAV_OBSTACLE

    def test_person_maps_to_obstacle(self):
        mask = np.array([[11]], dtype=np.uint8)  # Cityscapes: person
        result = cityscapes_to_traversability(mask)
        assert result[0, 0] == TRAV_OBSTACLE

    def test_car_maps_to_obstacle(self):
        mask = np.array([[13]], dtype=np.uint8)  # Cityscapes: car
        result = cityscapes_to_traversability(mask)
        assert result[0, 0] == TRAV_OBSTACLE

    def test_sky_maps_to_unknown(self):
        mask = np.array([[10]], dtype=np.uint8)  # Cityscapes: sky
        result = cityscapes_to_traversability(mask)
        assert result[0, 0] == TRAV_UNKNOWN

    def test_all_dynamic_obstacles_are_lethal(self):
        # person=11, rider=12, car=13, truck=14, bus=15, train=16,
        # motorcycle=17, bicycle=18
        for cid in [11, 12, 13, 14, 15, 16, 17, 18]:
            mask = np.array([[cid]], dtype=np.uint8)
            result = cityscapes_to_traversability(mask)
            assert result[0, 0] == TRAV_OBSTACLE, f"class {cid} should be OBSTACLE"

    def test_all_static_obstacles_are_lethal(self):
        # building=2, wall=3, fence=4, pole=5, traffic light=6, sign=7
        for cid in [2, 3, 4, 5, 6, 7]:
            mask = np.array([[cid]], dtype=np.uint8)
            result = cityscapes_to_traversability(mask)
            assert result[0, 0] == TRAV_OBSTACLE, f"class {cid} should be OBSTACLE"

    def test_out_of_range_id_clamped(self):
        """Class IDs beyond 18 should not crash — clamped to 18."""
        mask = np.array([[200]], dtype=np.uint8)
        result = cityscapes_to_traversability(mask)
        assert result[0, 0] in range(5)  # valid traversability class

    def test_multi_class_image(self):
        """A 2x3 image with mixed classes maps correctly."""
        mask = np.array([
            [1, 0, 8],    # sidewalk, road, vegetation
            [2, 11, 10],  # building, person, sky
        ], dtype=np.uint8)
        result = cityscapes_to_traversability(mask)
        assert result[0, 0] == TRAV_SIDEWALK
        assert result[0, 1] == TRAV_ROAD
        assert result[0, 2] == TRAV_GRASS
        assert result[1, 0] == TRAV_OBSTACLE
        assert result[1, 1] == TRAV_OBSTACLE
        assert result[1, 2] == TRAV_UNKNOWN

    def test_output_dtype_is_uint8(self):
        mask = np.zeros((4, 4), dtype=np.uint8)
        result = cityscapes_to_traversability(mask)
        assert result.dtype == np.uint8

    def test_output_shape_preserved(self):
        mask = np.zeros((32, 64), dtype=np.uint8)
        result = cityscapes_to_traversability(mask)
        assert result.shape == (32, 64)
+
+
+# ── traversability_to_costmap ─────────────────────────────────────────────────
+
class TestTraversabilityToCostmap:
    """traversability_to_costmap: traversability classes -> OccupancyGrid costs.

    Contract exercised below: sidewalk=0 (free), grass < road < obstacle=100
    (lethal), unknown=-1 unless unknown_as_obstacle=True.
    """

    def test_sidewalk_is_free(self):
        mask = np.array([[TRAV_SIDEWALK]], dtype=np.uint8)
        cost = traversability_to_costmap(mask)
        assert cost[0, 0] == 0

    def test_road_has_high_cost(self):
        mask = np.array([[TRAV_ROAD]], dtype=np.uint8)
        cost = traversability_to_costmap(mask)
        assert 50 < cost[0, 0] < 100  # high but not lethal

    def test_grass_has_medium_cost(self):
        mask = np.array([[TRAV_GRASS]], dtype=np.uint8)
        cost = traversability_to_costmap(mask)
        grass_cost = TRAV_TO_COST[TRAV_GRASS]
        assert cost[0, 0] == grass_cost
        assert grass_cost < TRAV_TO_COST[TRAV_ROAD]  # grass < road cost

    def test_obstacle_is_lethal(self):
        mask = np.array([[TRAV_OBSTACLE]], dtype=np.uint8)
        cost = traversability_to_costmap(mask)
        assert cost[0, 0] == 100

    def test_unknown_is_neg1_by_default(self):
        mask = np.array([[TRAV_UNKNOWN]], dtype=np.uint8)
        cost = traversability_to_costmap(mask)
        assert cost[0, 0] == -1

    def test_unknown_as_obstacle_flag(self):
        mask = np.array([[TRAV_UNKNOWN]], dtype=np.uint8)
        cost = traversability_to_costmap(mask, unknown_as_obstacle=True)
        assert cost[0, 0] == 100

    def test_cost_ordering(self):
        """sidewalk < grass < road < obstacle."""
        assert TRAV_TO_COST[TRAV_SIDEWALK] < TRAV_TO_COST[TRAV_GRASS]
        assert TRAV_TO_COST[TRAV_GRASS] < TRAV_TO_COST[TRAV_ROAD]
        assert TRAV_TO_COST[TRAV_ROAD] < TRAV_TO_COST[TRAV_OBSTACLE]

    def test_output_dtype_is_int8(self):
        mask = np.zeros((4, 4), dtype=np.uint8)
        cost = traversability_to_costmap(mask)
        assert cost.dtype == np.int8

    def test_output_shape_preserved(self):
        mask = np.zeros((16, 32), dtype=np.uint8)
        cost = traversability_to_costmap(mask)
        assert cost.shape == (16, 32)

    def test_mixed_mask(self):
        mask = np.array([
            [TRAV_SIDEWALK, TRAV_ROAD],
            [TRAV_OBSTACLE, TRAV_UNKNOWN],
        ], dtype=np.uint8)
        cost = traversability_to_costmap(mask)
        assert cost[0, 0] == TRAV_TO_COST[TRAV_SIDEWALK]
        assert cost[0, 1] == TRAV_TO_COST[TRAV_ROAD]
        assert cost[1, 0] == TRAV_TO_COST[TRAV_OBSTACLE]
        assert cost[1, 1] == -1  # unknown
diff --git a/jetson/ros2_ws/src/saltybot_segmentation_costmap/CMakeLists.txt b/jetson/ros2_ws/src/saltybot_segmentation_costmap/CMakeLists.txt
new file mode 100644
index 0000000..e53dc52
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation_costmap/CMakeLists.txt
@@ -0,0 +1,70 @@
cmake_minimum_required(VERSION 3.8)
project(saltybot_segmentation_costmap)

# Default to C++17 (required by rclcpp / nav2 on Humble)
if(NOT CMAKE_CXX_STANDARD)
  set(CMAKE_CXX_STANDARD 17)
endif()

if(CMAKE_COMPILER_IS_GNUCXX OR CMAKE_CXX_COMPILER_ID MATCHES "Clang")
  add_compile_options(-Wall -Wextra -Wpedantic)
endif()

# ── Dependencies ──────────────────────────────────────────────────────────────
find_package(ament_cmake REQUIRED)
find_package(rclcpp REQUIRED)
find_package(nav2_costmap_2d REQUIRED)
find_package(nav_msgs REQUIRED)
find_package(pluginlib REQUIRED)

# ── Shared library (the plugin) ───────────────────────────────────────────────
add_library(${PROJECT_NAME} SHARED
  src/segmentation_costmap_layer.cpp
)

# Build-tree vs installed include paths (generator expressions reconstructed —
# they were stripped to bare "$" in the mangled diff).
target_include_directories(${PROJECT_NAME} PUBLIC
  $<BUILD_INTERFACE:${CMAKE_CURRENT_SOURCE_DIR}/include>
  $<INSTALL_INTERFACE:include>
)

ament_target_dependencies(${PROJECT_NAME}
  rclcpp
  nav2_costmap_2d
  nav_msgs
  pluginlib
)

# Export plugin XML so pluginlib can discover the layer at runtime
pluginlib_export_plugin_description_file(nav2_costmap_2d plugin.xml)

# ── Install ───────────────────────────────────────────────────────────────────
install(TARGETS ${PROJECT_NAME}
  ARCHIVE DESTINATION lib
  LIBRARY DESTINATION lib
  RUNTIME DESTINATION bin
)

install(DIRECTORY include/
  DESTINATION include
)

install(FILES plugin.xml
  DESTINATION share/${PROJECT_NAME}
)

# ── Tests ─────────────────────────────────────────────────────────────────────
if(BUILD_TESTING)
  find_package(ament_lint_auto REQUIRED)
  ament_lint_auto_find_test_dependencies()
endif()

ament_export_include_directories(include)
ament_export_libraries(${PROJECT_NAME})
ament_export_dependencies(
  rclcpp
  nav2_costmap_2d
  nav_msgs
  pluginlib
)

ament_package()
diff --git a/jetson/ros2_ws/src/saltybot_segmentation_costmap/include/saltybot_segmentation_costmap/segmentation_costmap_layer.hpp b/jetson/ros2_ws/src/saltybot_segmentation_costmap/include/saltybot_segmentation_costmap/segmentation_costmap_layer.hpp
new file mode 100644
index 0000000..4d1393c
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation_costmap/include/saltybot_segmentation_costmap/segmentation_costmap_layer.hpp
@@ -0,0 +1,85 @@
+#pragma once
+
+#include
+#include
+
+#include "nav2_costmap_2d/layer.hpp"
+#include "nav2_costmap_2d/layered_costmap.hpp"
+#include "nav_msgs/msg/occupancy_grid.hpp"
+#include "rclcpp/rclcpp.hpp"
+
+namespace saltybot_segmentation_costmap
+{
+
+/**
+ * SegmentationCostmapLayer
+ *
+ * Nav2 costmap2d plugin that subscribes to /segmentation/costmap
+ * (nav_msgs/OccupancyGrid published by sidewalk_seg_node) and merges
+ * traversability costs into the Nav2 local_costmap.
+ *
+ * Merging strategy (combination_method parameter):
+ * "max" — keep the higher cost between existing and new (default, conservative)
+ * "override" — always write the new cost, replacing existing
+ * "min" — keep the lower cost (permissive)
+ *
+ * Cost mapping from OccupancyGrid int8 to Nav2 costmap uint8:
+ * -1 (unknown) → not written (cell unchanged)
+ * 0 (free) → FREE_SPACE (0)
+ * 1–99 (cost) → scaled to Nav2 range [1, INSCRIBED_INFLATED_OBSTACLE-1]
+ * 100 (lethal) → LETHAL_OBSTACLE (254)
+ *
+ * Add to Nav2 local_costmap params:
+ * local_costmap:
+ * plugins: ["voxel_layer", "inflation_layer", "segmentation_layer"]
+ * segmentation_layer:
+ * plugin: "saltybot_segmentation_costmap::SegmentationCostmapLayer"
+ * enabled: true
+ * topic: /segmentation/costmap
+ * combination_method: max
+ * max_obstacle_distance: 0.0 (use all cells)
+ */
+class SegmentationCostmapLayer : public nav2_costmap_2d::Layer
+{
+public:
+ SegmentationCostmapLayer();
+ ~SegmentationCostmapLayer() override = default;
+
+ void onInitialize() override;
+ void updateBounds(
+ double robot_x, double robot_y, double robot_yaw,
+ double * min_x, double * min_y,
+ double * max_x, double * max_y) override;
+ void updateCosts(
+ nav2_costmap_2d::Costmap2D & master_grid,
+ int min_i, int min_j, int max_i, int max_j) override;
+
+ void reset() override;
+ bool isClearable() override { return true; }
+
+private:
+ void segCostmapCallback(const nav_msgs::msg::OccupancyGrid::SharedPtr msg);
+
+ /**
+ * Map OccupancyGrid int8 value to Nav2 costmap uint8 cost.
+ * -1 → leave unchanged (return false)
+ * 0 → FREE_SPACE (0)
+ * 1–99 → 1 to INSCRIBED_INFLATED_OBSTACLE-1 (linear scale)
+ * 100 → LETHAL_OBSTACLE (254)
+ */
+ static bool occupancyToCost(int8_t occ, unsigned char & cost_out);
+
+ rclcpp::Subscription::SharedPtr sub_;
+ nav_msgs::msg::OccupancyGrid::SharedPtr latest_grid_;
+ std::mutex grid_mutex_;
+
+ std::string topic_;
+ std::string combination_method_; // "max", "override", "min"
+ bool enabled_;
+
+ // Track dirty bounds for updateBounds()
+ double last_min_x_, last_min_y_, last_max_x_, last_max_y_;
+ bool need_update_;
+};
+
+} // namespace saltybot_segmentation_costmap
diff --git a/jetson/ros2_ws/src/saltybot_segmentation_costmap/package.xml b/jetson/ros2_ws/src/saltybot_segmentation_costmap/package.xml
new file mode 100644
index 0000000..3e2b841
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation_costmap/package.xml
@@ -0,0 +1,27 @@
<?xml version="1.0"?>
<package format="3">
  <name>saltybot_segmentation_costmap</name>
  <version>0.1.0</version>
  <description>
    Nav2 costmap2d plugin: SegmentationCostmapLayer.
    Merges semantic traversability scores from sidewalk_seg_node into
    the Nav2 local_costmap — sidewalk free, road high-cost, obstacle lethal.
  </description>
  <maintainer email="seb@vayrette.com">seb</maintainer>
  <license>MIT</license>

  <buildtool_depend>ament_cmake</buildtool_depend>

  <depend>rclcpp</depend>
  <depend>nav2_costmap_2d</depend>
  <depend>nav_msgs</depend>
  <depend>pluginlib</depend>

  <test_depend>ament_lint_auto</test_depend>
  <test_depend>ament_lint_common</test_depend>

  <export>
    <build_type>ament_cmake</build_type>
  </export>
</package>
diff --git a/jetson/ros2_ws/src/saltybot_segmentation_costmap/plugin.xml b/jetson/ros2_ws/src/saltybot_segmentation_costmap/plugin.xml
new file mode 100644
index 0000000..886abe6
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation_costmap/plugin.xml
@@ -0,0 +1,13 @@
<library path="saltybot_segmentation_costmap">
  <class type="saltybot_segmentation_costmap::SegmentationCostmapLayer"
         base_class_type="nav2_costmap_2d::Layer">
    <description>
      Nav2 costmap layer that merges semantic traversability scores from
      /segmentation/costmap (published by sidewalk_seg_node) into the
      Nav2 local_costmap. Roads are high-cost, obstacles are lethal,
      sidewalks are free.
    </description>
  </class>
</library>
diff --git a/jetson/ros2_ws/src/saltybot_segmentation_costmap/src/segmentation_costmap_layer.cpp b/jetson/ros2_ws/src/saltybot_segmentation_costmap/src/segmentation_costmap_layer.cpp
new file mode 100644
index 0000000..fe31b2e
--- /dev/null
+++ b/jetson/ros2_ws/src/saltybot_segmentation_costmap/src/segmentation_costmap_layer.cpp
@@ -0,0 +1,207 @@
#include "saltybot_segmentation_costmap/segmentation_costmap_layer.hpp"

#include <algorithm>
#include <functional>
#include <stdexcept>

#include "nav2_costmap_2d/costmap_2d.hpp"
#include "pluginlib/class_list_macros.hpp"
+
+PLUGINLIB_EXPORT_CLASS(
+ saltybot_segmentation_costmap::SegmentationCostmapLayer,
+ nav2_costmap_2d::Layer)
+
+namespace saltybot_segmentation_costmap
+{
+
+using nav2_costmap_2d::FREE_SPACE;
+using nav2_costmap_2d::LETHAL_OBSTACLE;
+using nav2_costmap_2d::INSCRIBED_INFLATED_OBSTACLE;
+using nav2_costmap_2d::NO_INFORMATION;
+
+SegmentationCostmapLayer::SegmentationCostmapLayer()
+: last_min_x_(-1e9), last_min_y_(-1e9),
+ last_max_x_(1e9), last_max_y_(1e9),
+ need_update_(false)
+{}
+
+// ── onInitialize ─────────────────────────────────────────────────────────────
+
+void SegmentationCostmapLayer::onInitialize()
+{
+ auto node = node_.lock();
+ if (!node) {
+ throw std::runtime_error("SegmentationCostmapLayer: node handle expired");
+ }
+
+ declareParameter("enabled", rclcpp::ParameterValue(true));
+ declareParameter("topic", rclcpp::ParameterValue(std::string("/segmentation/costmap")));
+ declareParameter("combination_method", rclcpp::ParameterValue(std::string("max")));
+
+ enabled_ = node->get_parameter(name_ + "." + "enabled").as_bool();
+ topic_ = node->get_parameter(name_ + "." + "topic").as_string();
+ combination_method_ = node->get_parameter(name_ + "." + "combination_method").as_string();
+
+ RCLCPP_INFO(
+ node->get_logger(),
+ "SegmentationCostmapLayer: topic=%s method=%s",
+ topic_.c_str(), combination_method_.c_str());
+
+ // Transient local QoS to match the sidewalk_seg_node publisher
+ rclcpp::QoS qos(rclcpp::KeepLast(1));
+ qos.transient_local();
+ qos.reliable();
+
+ sub_ = node->create_subscription(
+ topic_, qos,
+ std::bind(
+ &SegmentationCostmapLayer::segCostmapCallback, this,
+ std::placeholders::_1));
+
+ current_ = true;
+}
+
+// ── Subscription callback ─────────────────────────────────────────────────────
+
+void SegmentationCostmapLayer::segCostmapCallback(
+ const nav_msgs::msg::OccupancyGrid::SharedPtr msg)
+{
+ std::lock_guard lock(grid_mutex_);
+ latest_grid_ = msg;
+ need_update_ = true;
+}
+
+// ── updateBounds ──────────────────────────────────────────────────────────────
+
+void SegmentationCostmapLayer::updateBounds(
+ double /*robot_x*/, double /*robot_y*/, double /*robot_yaw*/,
+ double * min_x, double * min_y,
+ double * max_x, double * max_y)
+{
+ if (!enabled_) {return;}
+
+ std::lock_guard lock(grid_mutex_);
+ if (!latest_grid_) {return;}
+
+ const auto & info = latest_grid_->info;
+ double ox = info.origin.position.x;
+ double oy = info.origin.position.y;
+ double gw = info.width * info.resolution;
+ double gh = info.height * info.resolution;
+
+ last_min_x_ = ox;
+ last_min_y_ = oy;
+ last_max_x_ = ox + gw;
+ last_max_y_ = oy + gh;
+
+ *min_x = std::min(*min_x, last_min_x_);
+ *min_y = std::min(*min_y, last_min_y_);
+ *max_x = std::max(*max_x, last_max_x_);
+ *max_y = std::max(*max_y, last_max_y_);
+}
+
+// ── updateCosts ───────────────────────────────────────────────────────────────
+
+void SegmentationCostmapLayer::updateCosts(
+ nav2_costmap_2d::Costmap2D & master,
+ int min_i, int min_j, int max_i, int max_j)
+{
+ if (!enabled_) {return;}
+
+ std::lock_guard lock(grid_mutex_);
+ if (!latest_grid_ || !need_update_) {return;}
+
+ const auto & info = latest_grid_->info;
+ const auto & data = latest_grid_->data;
+
+ float seg_res = info.resolution;
+ float seg_ox = static_cast(info.origin.position.x);
+ float seg_oy = static_cast(info.origin.position.y);
+ int seg_w = static_cast(info.width);
+ int seg_h = static_cast(info.height);
+
+ float master_res = static_cast(master.getResolution());
+
+ // Iterate over the update window
+ for (int j = min_j; j < max_j; ++j) {
+ for (int i = min_i; i < max_i; ++i) {
+ // World coords of this master cell centre
+ double wx, wy;
+ master.mapToWorld(
+ static_cast(i), static_cast(j), wx, wy);
+
+ // Corresponding cell in segmentation grid
+ int seg_col = static_cast((wx - seg_ox) / seg_res);
+ int seg_row = static_cast((wy - seg_oy) / seg_res);
+
+ if (seg_col < 0 || seg_col >= seg_w ||
+ seg_row < 0 || seg_row >= seg_h) {
+ continue;
+ }
+
+ int seg_idx = seg_row * seg_w + seg_col;
+ if (seg_idx < 0 || seg_idx >= static_cast(data.size())) {
+ continue;
+ }
+
+ int8_t occ = data[static_cast(seg_idx)];
+ unsigned char new_cost = 0;
+ if (!occupancyToCost(occ, new_cost)) {
+ continue; // unknown cell — leave master unchanged
+ }
+
+ unsigned char existing = master.getCost(
+ static_cast(i), static_cast(j));
+
+ unsigned char final_cost = existing;
+ if (combination_method_ == "override") {
+ final_cost = new_cost;
+ } else if (combination_method_ == "min") {
+ final_cost = std::min(existing, new_cost);
+ } else {
+ // "max" (default) — most conservative
+ final_cost = std::max(existing, new_cost);
+ }
+
+ master.setCost(
+ static_cast(i), static_cast(j),
+ final_cost);
+ }
+ }
+
+ need_update_ = false;
+}
+
+// ── reset ─────────────────────────────────────────────────────────────────────
+
+void SegmentationCostmapLayer::reset()
+{
+ std::lock_guard lock(grid_mutex_);
+ latest_grid_.reset();
+ need_update_ = false;
+ current_ = true;
+}
+
+// ── occupancyToCost ───────────────────────────────────────────────────────────
+
+bool SegmentationCostmapLayer::occupancyToCost(int8_t occ, unsigned char & cost_out)
+{
+ if (occ < 0) {
+ return false; // unknown — leave cell unchanged
+ }
+ if (occ == 0) {
+ cost_out = FREE_SPACE;
+ return true;
+ }
+ if (occ >= 100) {
+ cost_out = LETHAL_OBSTACLE;
+ return true;
+ }
+ // Scale 1–99 → 1 to (INSCRIBED_INFLATED_OBSTACLE-1) = 1 to 252
+ int scaled = 1 + static_cast(
+ (occ - 1) * (INSCRIBED_INFLATED_OBSTACLE - 2) / 98.0f);
+ cost_out = static_cast(
+ std::min(scaled, static_cast(INSCRIBED_INFLATED_OBSTACLE - 1)));
+ return true;
+}
+
+} // namespace saltybot_segmentation_costmap