geosensing
diff --git a/‎README.md‎
Lines changed: 56 additions & 26 deletions b/‎README.md‎
Lines changed: 56 additions & 26 deletions
diff --git a/‎allocator/__init__.py‎
Lines changed: 5 additions & 0 deletions b/‎allocator/__init__.py‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎allocator/api/__init__.py‎
Lines changed: 12 additions & 1 deletion b/‎allocator/api/__init__.py‎
Lines changed: 12 additions & 1 deletion
diff --git a/‎allocator/api/random_walk.py‎
Lines changed: 139 additions & 0 deletions b/‎allocator/api/random_walk.py‎
Lines changed: 139 additions & 0 deletions
diff --git a/‎allocator/api/types.py‎
Lines changed: 9 additions & 0 deletions b/‎allocator/api/types.py‎
Lines changed: 9 additions & 0 deletions
diff --git a/‎allocator/cli/main.py‎
Lines changed: 2 additions & 0 deletions b/‎allocator/cli/main.py‎
Lines changed: 2 additions & 0 deletions
@@ -1,57 +1,87 @@
-# allocator: Efficiently collect data from geographically distributed locations
+# allocator
 
 [![PyPI version](https://img.shields.io/pypi/v/allocator.svg)](https://pypi.python.org/pypi/allocator)
 [![Downloads](https://pepy.tech/badge/allocator)](https://pepy.tech/project/allocator)
 [![CI](https://github.com/geosensing/allocator/actions/workflows/ci.yml/badge.svg)](https://github.com/geosensing/allocator/actions/workflows/ci.yml)
 [![Documentation](https://img.shields.io/badge/docs-github.io-blue)](https://geosensing.github.io/allocator/)
 
-**Allocator** provides a modern, Pythonic API for geographic task allocation, clustering, and routing optimization.
+Field teams, delivery services, and survey organizations waste time and money on inefficient routes. When you have 100+ locations to visit, manual planning fails. Allocator solves this.
 
-## Key Features
+## What It Does
 
-- **🎯 Clustering**: Group geographic points into balanced zones
-- **🛣️ Routing**: Find optimal paths through locations (TSP solving)  
-- **📍 Assignment**: Connect points to closest workers/centers
-- **🚀 Performance**: Optimized algorithms with NumPy and scikit-learn
-- **📦 Modern API**: Clean Python interface + unified CLI
+- **Cluster**: Divide locations into balanced work zones
+- **Route**: Find the shortest path through locations (TSP)
+- **Assign**: Match locations to nearest workers or depots
+- **Random Walk**: Generate survey itineraries on road networks
 
-## Quick Start
+## Install
 
 ```bash
 pip install allocator
 ```
 
+## Python API
+
+### Cluster locations into zones
+
 ```python
 import allocator
 import pandas as pd
 
-# Geographic locations
 locations = pd.DataFrame({
-    'longitude': [100.5018, 100.5065, 100.5108],
-    'latitude': [13.7563, 13.7590, 13.7633]
+    'longitude': [100.501, 100.506, 100.510, 100.515, 100.520],
+    'latitude': [13.756, 13.759, 13.763, 13.768, 13.772]
 })
 
-# Group into zones
-clusters = allocator.cluster(locations, n_clusters=2)
+result = allocator.cluster(locations, n_clusters=2)
+print(result.labels)  # [0 0 0 1 1]
+```
+
+### Find shortest route
+
+```python
+route = allocator.shortest_path(locations, method='ortools')
+print(route.route)  # [0, 1, 2, 4, 3, 0]
+```
 
-# Find optimal route
-route = allocator.shortest_path(locations)
+### Assign to nearest depot
 
-# Assign to service centers
-centers = pd.DataFrame({
+```python
+depots = pd.DataFrame({
     'longitude': [100.50, 100.52],
     'latitude': [13.75, 13.77]
 })
-assignments = allocator.assign(locations, centers)
+
+assignments = allocator.assign_to_closest(locations, depots)
+print(assignments.data['assigned_worker'].tolist())  # [0, 0, 1, 1, 1]
+```
+
+### Generate random walk itineraries
+
+```python
+import networkx as nx
+
+# Load road network graph (from OSMnx or similar)
+G = nx.read_graphml("road_network.graphml")
+
+result = allocator.random_walk(G, n_walks=10, walk_length_m=5000)
+print(result.data)  # DataFrame with waypoints
+```
+
+## CLI
+
+```bash
+allocator cluster kmeans locations.csv -n 5 -o zones.csv
+allocator route tsp locations.csv --method ortools -o route.csv
+allocator sort locations.csv --workers depots.csv -o assignments.csv
+allocator random-walk road_network.graphml -n 10 -l 5000 -o waypoints.csv
 ```
 
-## Documentation & Examples
+## Documentation
 
-- **📖 [Full Documentation](https://geosensing.github.io/allocator/)**
-- **🚀 [Installation & Tutorial](https://geosensing.github.io/allocator/quickstart.html)**  
-- **🔧 [API Reference](https://geosensing.github.io/allocator/api/clustering.html)**
-- **💡 [Real-World Examples](https://geosensing.github.io/allocator/examples/overview.html)**
+- [Full Documentation](https://geosensing.github.io/allocator/)
+- [API Reference](https://geosensing.github.io/allocator/api/clustering.html)
 
-## License & Contributing
+## License
 
-MIT License. Contributions welcome - see [Contributing Guide](https://geosensing.github.io/allocator/contributing.html).
+MIT
@@ -44,13 +44,15 @@
     ClusterResult,
     ComparisonResult,
     ItineraryResult,
+    RandomWalkResult,
     RouteResult,
     SortResult,
     assign_to_closest,
     cluster,
     create_itineraries,
     distance_assignment,
     kmeans,
+    random_walk,
     shortest_path,
     sort_by_distance,
     tsp_christofides,
@@ -76,6 +78,7 @@
     "ClusterResult",
     "ComparisonResult",
     "ItineraryResult",
+    "RandomWalkResult",
     "RouteResult",
     "SortResult",
     # Main functions
@@ -98,6 +101,8 @@
     "plot_clusters",
     "plot_comparison",
     "plot_route",
+    # Random walk
+    "random_walk",
     # Logging utilities
     "setup_logging",
     "shortest_path",
 
@@ -7,14 +7,23 @@
 from .cluster import cluster, kmeans
 from .distance import assign_to_closest, distance_assignment, sort_by_distance
 from .itinerary import create_itineraries
+from .random_walk import random_walk
 from .route import shortest_path, tsp_christofides, tsp_google, tsp_ortools, tsp_osrm
-from .types import ClusterResult, ComparisonResult, ItineraryResult, RouteResult, SortResult
+from .types import (
+    ClusterResult,
+    ComparisonResult,
+    ItineraryResult,
+    RandomWalkResult,
+    RouteResult,
+    SortResult,
+)
 
 __all__ = [
     # Result types
     "ClusterResult",
     "ComparisonResult",
     "ItineraryResult",
+    "RandomWalkResult",
     "RouteResult",
     "SortResult",
     # Distance assignment methods
@@ -25,6 +34,8 @@
     "distance_assignment",
     # Specific clustering methods
     "kmeans",
+    # Random walk
+    "random_walk",
     "shortest_path",
     "sort_by_distance",
     # Specific routing methods
 
@@ -0,0 +1,139 @@
+"""
+API for random walk itinerary generation on road networks.
+"""
+
+from typing import Any
+
+import networkx as nx
+import numpy as np
+import pandas as pd
+
+from ..core.random_walk import (
+    generate_walks,
+    get_largest_connected_component,
+    validate_graph,
+)
+from .types import RandomWalkResult
+
+
+def random_walk(
+    graph: nx.Graph,
+    n_walks: int = 15,
+    walk_length_m: float = 5000.0,
+    start_points: list[Any] | None = None,
+    seed: int | None = None,
+    use_largest_component: bool = True,
+) -> RandomWalkResult:
+    """
+    Generate self-weighting random walk itineraries on a road network graph.
+
+    Random walks on road networks have a self-weighting property: at each
+    intersection of degree d, choosing the next edge uniformly (probability 1/d)
+    ensures that the time-average along the walk converges to a length-weighted
+    spatial average. This eliminates the need for explicit inclusion probabilities.
+
+    Args:
+        graph: NetworkX graph from OSMnx or geo-sampling. Must have:
+            - Node attributes: x/y, lon/lat, or longitude/latitude
+            - Edge attributes: length (in meters)
+        n_walks: Number of independent walks to generate (default 15)
+        walk_length_m: Target length of each walk in meters (default 5000.0)
+        start_points: Optional list of starting node IDs. If provided, walks
+            cycle through these points (useful for GRTS-selected starting locations).
+            If None, random nodes are chosen uniformly.
+        seed: Random seed for reproducibility
+        use_largest_component: If True (default), use only the largest connected
+            component of the graph to avoid getting stuck in disconnected regions.
+            When nodes are dropped, the graph statistics in ``metadata``
+            describe that component rather than the input graph.
+
+    Returns:
+        RandomWalkResult containing:
+            - walks: List of walk dicts, each with:
+                - waypoints: List of (lon, lat, cumulative_distance_m) tuples
+                - edges_traversed: List of (from_node, to_node, length_m) tuples
+                - total_distance_m: Actual distance walked
+            - data: DataFrame with all waypoints (columns present even if empty):
+                - walk_id: Walk index
+                - sequence: Waypoint sequence number within walk
+                - longitude: Waypoint longitude
+                - latitude: Waypoint latitude
+                - cumulative_distance_m: Distance from walk start
+            - metadata: Dict with:
+                - n_walks: Number of walks generated
+                - walk_length_m: Target walk length
+                - total_network_length_m: Sum of all edge lengths
+                - n_nodes: Number of nodes in graph
+                - n_edges: Number of edges in graph
+                - seed: Random seed used
+                - avg_actual_distance_m: Mean actual walk distance
+                - start_points_provided: Whether start_points was provided
+
+    Raises:
+        ValueError: If graph has no valid nodes or edges
+
+    Example:
+        >>> import networkx as nx
+        >>> import allocator
+        >>>
+        >>> # Create a simple test graph
+        >>> G = nx.Graph()
+        >>> G.add_node(0, longitude=100.0, latitude=13.0)
+        >>> G.add_node(1, longitude=100.1, latitude=13.0)
+        >>> G.add_edge(0, 1, length=1000.0)
+        >>>
+        >>> result = allocator.random_walk(G, n_walks=5, walk_length_m=500.0, seed=42)
+        >>> len(result.walks)
+        5
+    """
+    validation = validate_graph(graph)
+    if not validation["valid"]:
+        raise ValueError(f"Invalid graph: {'; '.join(validation['errors'])}")
+
+    working_graph = graph
+    if use_largest_component:
+        working_graph = get_largest_connected_component(graph)
+        # Re-validate only when nodes were dropped so metadata matches the walked graph.
+        if working_graph.number_of_nodes() < graph.number_of_nodes():
+            validation = validate_graph(working_graph)
+
+    walks = generate_walks(
+        working_graph,
+        n_walks=n_walks,
+        walk_length_m=walk_length_m,
+        start_points=start_points,
+        rng=np.random.default_rng(seed),
+    )
+
+    # Flatten every walk's waypoints into one long-format table.
+    columns = ["walk_id", "sequence", "longitude", "latitude", "cumulative_distance_m"]
+    rows = []
+    for walk_id, walk in enumerate(walks):
+        for seq, (lon, lat, cum_dist) in enumerate(walk["waypoints"]):
+            rows.append(
+                {
+                    "walk_id": walk_id,
+                    "sequence": seq,
+                    "longitude": lon,
+                    "latitude": lat,
+                    "cumulative_distance_m": cum_dist,
+                }
+            )
+
+    # Explicit columns keep the documented schema even when no waypoints exist.
+    data = pd.DataFrame(rows, columns=columns)
+
+    actual_distances = [w["total_distance_m"] for w in walks]
+
+    metadata = {
+        "n_walks": len(walks),
+        "walk_length_m": walk_length_m,
+        "total_network_length_m": validation["total_network_length_m"],
+        "n_nodes": validation["n_nodes"],
+        "n_edges": validation["n_edges"],
+        "seed": seed,
+        "avg_actual_distance_m": float(np.mean(actual_distances)) if walks else 0.0,
+        "start_points_provided": start_points is not None,
+    }
+
+    return RandomWalkResult(walks=walks, data=data, metadata=metadata)
@@ -62,3 +62,12 @@ class ItineraryResult:
     distances: list[float]
     data: pd.DataFrame
     metadata: dict[str, Any]
+
+
+@dataclass
+class RandomWalkResult:
+    """Walks, flattened waypoint table, and run metadata from random-walk generation."""
+
+    walks: list[dict[str, Any]]  # one dict per generated walk
+    data: pd.DataFrame  # all waypoints, one row per waypoint
+    metadata: dict[str, Any]  # run parameters and graph statistics
@@ -11,6 +11,7 @@
 from .. import __version__
 from .cluster_cmd import kmeans
 from .itinerary_cmd import itinerary
+from .random_walk_cmd import random_walk_cmd
 from .route_cmd import christofides, ortools, tsp
 
 console = Console()
@@ -53,6 +54,7 @@ def route() -> None:
 route.add_command(christofides)
 route.add_command(ortools)
 cli.add_command(itinerary)
+cli.add_command(random_walk_cmd, name="random-walk")
 
 
 @cli.command()