Commit 440fe0a

gitignore: ignore perf.data* profiling files
1 parent 9dd1fe1 commit 440fe0a

5 files changed: 112 additions & 90 deletions


.gitignore

Lines changed: 3 additions & 1 deletion
@@ -118,4 +118,6 @@ Cargo.lock
 # These are backup files generated by rustfmt
 **/*.rs.bk
 
-.idea
+.idea
+# Ignore perf profiling data
+perf.data*
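
Note: Linux perf writes its profiling output to perf.data and rotates the previous run to perf.data.old, so the perf.data* glob should cover both the current and the backed-up profile.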

src/apps/hnsw/coordinator/mod.rs

Lines changed: 63 additions & 34 deletions
@@ -133,10 +133,11 @@ impl Service for HNSWIndexService {
                 )
                 .await
                 .map_err(|e| format!("Failed to create new job (RPC): {:?}", e))??;
-            cell_client
-                .next_iteration(false, job_id)
+            // Advance from initial starting vertices using combined RPC
+            let _ = cell_client
+                .advance_iteration(job_id, Vec::new(), false)
                 .await
-                .map_err(|e| format!("Failed to navigate to closest (RPC): {:?}", e))??;
+                .map_err(|e| format!("Failed to navigate to closest (RPC): {:?}", e))?;
             cell_client
                 .index_cell(job_id, cell_id)
                 .await
@@ -159,16 +160,30 @@ impl Service for HNSWIndexService {
         async move {
             self.broadcast_new_job(job_id, schema, field_id, query, 1, ef, ef, metric)
                 .await?;
-            self.broadcast_navigate_to_closest(job_id, max_iter as usize)
+            let participants = self
+                .broadcast_navigate_to_closest(job_id, max_iter as usize)
                 .await?;
-            let tops = broadcast_to_members(
-                &self.conshash,
-                move |partition_svr: Arc<PartitionSvrClient>| async move {
-                    partition_svr.top(job_id).await
-                },
-            )
-            .await
-            .map_err(|e| format!("Failed to get top result: {:?}", e))?;
+            let tops = if participants.is_empty() {
+                broadcast_to_members(
+                    &self.conshash,
+                    move |partition_svr: Arc<PartitionSvrClient>| async move {
+                        partition_svr.top(job_id).await
+                    },
+                )
+                .await
+                .map_err(|e| format!("Failed to get top result: {:?}", e))?
+            } else {
+                let server_ids = participants.into_iter().sorted().collect_vec();
+                broadcast_with_server_ids(
+                    server_ids.into_iter(),
+                    &self.conshash,
+                    move |partition_svr: Arc<PartitionSvrClient>| async move {
+                        partition_svr.top(job_id).await
+                    },
+                )
+                .await
+                .map_err(|e| format!("Failed to get top result: {:?}", e))?
+            };
             let top = tops
                 .iter()
                 .filter_map(|(sid, res)| {
@@ -206,16 +221,30 @@ impl Service for HNSWIndexService {
         async move {
             self.broadcast_new_job(job_id, schema, field_id, query, k as u64, ef, ef, metric)
                 .await?;
-            self.broadcast_navigate_to_closest(job_id, max_iter as usize)
+            let participants = self
+                .broadcast_navigate_to_closest(job_id, max_iter as usize)
                 .await?;
-            let tops = broadcast_to_members(
-                &self.conshash,
-                move |partition_svr: Arc<PartitionSvrClient>| async move {
-                    partition_svr.top_k(job_id, k as u32).await
-                },
-            )
-            .await
-            .map_err(|e| format!("Failed to get top result: {:?}", e))?;
+            let tops = if participants.is_empty() {
+                broadcast_to_members(
+                    &self.conshash,
+                    move |partition_svr: Arc<PartitionSvrClient>| async move {
+                        partition_svr.top_k(job_id, k as u32).await
+                    },
+                )
+                .await
+                .map_err(|e| format!("Failed to get top result: {:?}", e))?
+            } else {
+                let server_ids = participants.into_iter().sorted().collect_vec();
+                broadcast_with_server_ids(
+                    server_ids.into_iter(),
+                    &self.conshash,
+                    move |partition_svr: Arc<PartitionSvrClient>| async move {
+                        partition_svr.top_k(job_id, k as u32).await
+                    },
+                )
+                .await
+                .map_err(|e| format!("Failed to get top result: {:?}", e))?
+            };
             let top_k = tops
                 .iter()
                 .filter_map(|(sid, res)| {
@@ -382,14 +411,15 @@ impl HNSWIndexService {
         &self,
         job_id: JobId,
         max_iter: usize,
-    ) -> Result<(), String> {
+    ) -> Result<HashSet<u64>, String> {
+        let mut participants: HashSet<u64> = HashSet::default();
         let mut new_frontiers = self.broadcast_all_next_iteration(job_id, false).await?;
         let mut iter = 1;
         while !new_frontiers.is_empty() {
             if iter >= max_iter {
                 // reached max iterations, just stop there
                 // TODO: maybe we should consider repartition the graph when this happens
-                return Ok(());
+                return Ok(participants);
             }
             iter += 1;
             let server_frontiers = new_frontiers
@@ -402,22 +432,17 @@ impl HNSWIndexService {
                 .collect::<HashMap<_, _>>();
             let frontiers = Arc::new(server_frontiers);
             let server_ids = frontiers.keys().cloned().collect_vec();
+            participants.extend(server_ids.iter().cloned());
             let broadcast_res = broadcast_with_server_ids(
                 server_ids.into_iter(),
                 &self.conshash,
                 move |partition_svr: Arc<PartitionSvrClient>| {
                     let frontiers = frontiers.clone();
                     async move {
                         let ids = frontiers.get(&partition_svr.server_id()).unwrap();
-                        let set_res = partition_svr.set_frontiers(job_id, ids.clone()).await?;
-                        if let Err(e) = &set_res {
-                            return Ok(Err(format!(
-                                "Failed to set frontiers on {}: {:?}",
-                                partition_svr.server_id(),
-                                e
-                            )));
-                        }
-                        let new_frontier = partition_svr.next_iteration(false, job_id).await?;
+                        let new_frontier = partition_svr
+                            .advance_iteration(job_id, ids.clone(), false)
+                            .await?;
                         Ok(new_frontier)
                     }
                 },
@@ -445,7 +470,7 @@ impl HNSWIndexService {
                 }
             }
         }
-        Ok(())
+        Ok(participants)
     }
 
     async fn broadcast_next_iteration<I>(
@@ -457,12 +482,16 @@ impl HNSWIndexService {
     where
         I: Iterator<Item = u64>,
     {
+        // With advance_iteration, there is no separate next_iteration without frontiers.
+        // So we call it with empty frontiers to drive local iteration.
+        let empty: Vec<Id> = Vec::new();
         let next_iteration_res = broadcast_with_server_ids(
             server_ids.into_iter(),
             &self.conshash,
             move |partition_svr: Arc<PartitionSvrClient>| {
                 let job_id = job_id.clone();
-                async move { partition_svr.next_iteration(readonly, job_id).await }
+                let empty_clone = empty.clone();
+                async move { partition_svr.advance_iteration(job_id, empty_clone, readonly).await }
             },
         )
         .await
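
Taken together, the coordinator changes implement one optimization: while broadcast_navigate_to_closest iterates, it records every server that ever received frontiers, and the final top/top_k aggregation is sent only to that participant set (sorted for deterministic ordering). Only when no remote server participated does it fall back to the original cluster-wide broadcast_to_members path. A minimal, self-contained sketch of that bookkeeping, with plain standard-library maps standing in for the project's conshash and RPC clients (next_frontiers is a made-up stand-in for one search round):

use std::collections::{HashMap, HashSet};

// Hypothetical stand-in for one search round: maps server id -> frontier
// vertices that server must expand next. An empty map means converged.
fn next_frontiers(round: usize) -> HashMap<u64, Vec<u64>> {
    match round {
        0 => HashMap::from([(1, vec![10, 11]), (3, vec![12])]),
        1 => HashMap::from([(3, vec![13])]),
        _ => HashMap::new(),
    }
}

fn main() {
    // Record every server that ever received frontiers during the search.
    let mut participants: HashSet<u64> = HashSet::new();
    let mut round = 0;
    loop {
        let frontiers = next_frontiers(round);
        if frontiers.is_empty() {
            break;
        }
        participants.extend(frontiers.keys().copied());
        round += 1;
    }
    // Fan the final top/top_k query out only to the participants,
    // in sorted order, instead of broadcasting to every member.
    let mut targets: Vec<u64> = participants.into_iter().collect();
    targets.sort_unstable(); // mirrors .sorted() in the commit
    println!("query top-k only on servers {:?}", targets);
}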

src/apps/hnsw/partition/search.rs

Lines changed: 24 additions & 22 deletions
@@ -454,28 +454,30 @@ impl HnswOnlinePartition {
                 vec![]
             }
             Err(NeighbourhoodError::IdListError(IdListError::ContainerCellNotReady)) => {
-                // If the container cell is not ready, we need to prepare the it
-                append_job_log(
-                    logger,
-                    job_id,
-                    JobLogLevel::Info,
-                    format!("Container cell not ready for vertex {:?}, preparing it", id),
-                );
-                let field_id = ed.as_field();
-                let _ = engine
-                    .graph_transaction(DefaultPartitioner, move |txn| {
-                        let mut list = IdList::from_txn_and_container(
-                            &txn.neb_txn,
-                            *id,
-                            field_id,
-                            schema_id,
-                        );
-                        async move {
-                            list.ensure_list().await;
-                            Ok(())
-                        }
-                    })
-                    .await;
+                // Respect readonly: do not perform writes during query navigation
+                if !readonly {
+                    append_job_log(
+                        logger,
+                        job_id,
+                        JobLogLevel::Info,
+                        format!("Container cell not ready for vertex {:?}, preparing it", id),
+                    );
+                    let field_id = ed.as_field();
+                    let _ = engine
+                        .graph_transaction(DefaultPartitioner, move |txn| {
+                            let mut list = IdList::from_txn_and_container(
+                                &txn.neb_txn,
+                                *id,
+                                field_id,
+                                schema_id,
+                            );
+                            async move {
+                                list.ensure_list().await;
+                                Ok(())
+                            }
+                        })
+                        .await;
+                }
                 vec![]
             }
             Err(e) => {
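
The effect of the new gate: a not-ready container cell is repaired lazily only when the job may write, while readonly (query-time) traversals skip the repair and simply report an empty neighbourhood for this round. A toy sketch of the pattern, with a plain HashMap standing in for the graph engine (neighbours and store are invented for illustration):

use std::collections::HashMap;

// An unready neighbour list is repaired lazily only on the write path.
fn neighbours(store: &mut HashMap<u64, Vec<u64>>, id: u64, readonly: bool) -> Vec<u64> {
    if let Some(list) = store.get(&id) {
        return list.clone();
    }
    if !readonly {
        // Write path: prepare the missing container, like ensure_list().
        store.insert(id, Vec::new());
    }
    // Either way, the caller sees an empty neighbourhood this iteration.
    Vec::new()
}

fn main() {
    let mut store = HashMap::new();
    assert!(neighbours(&mut store, 7, true).is_empty()); // readonly: no write
    assert!(!store.contains_key(&7));
    neighbours(&mut store, 7, false); // write path repairs the container
    assert!(store.contains_key(&7));
}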

src/apps/hnsw/partition/service.rs

Lines changed: 16 additions & 27 deletions
@@ -47,9 +47,9 @@ pub mod service {
         rpc end_job(job_id: JobId) -> bool;
 
         // Then use multiple iterations (or not) to do the actual search
-        // It returns remove frontiers to be processed by other partitions
-        rpc next_iteration(readonly: bool, job_id: JobId) -> Result<HashSet<Id>, String>;
-        rpc set_frontiers(job_id: JobId, frontiers: Vec<Id>) -> Result<(), String>;
+        // It returns remote frontiers to be processed by other partitions
+        // Combined RPC to reduce per-iteration round-trips: set frontiers and advance one iteration
+        rpc advance_iteration(job_id: JobId, frontiers: Vec<Id>, readonly: bool) -> Result<HashSet<Id>, String>;
 
         // After a search is completed, it can call following functions
         rpc index_cell(job_id: JobId, cell_id: Id) -> Result<(), String>;
@@ -158,34 +158,13 @@ impl service::Service for service::HNSWPartitionService {
         .boxed()
     }
 
-    fn set_frontiers<'a>(
+
+
+    fn advance_iteration<'a>(
         &'a self,
         job_id: JobId,
         frontiers: Vec<Id>,
-    ) -> BoxFuture<'a, Result<(), String>> {
-        async move {
-            let job = match self
-                .jobs
-                .get(&job_id)
-                .ok_or(format!("Job {:?} not found", job_id))
-            {
-                Ok(job) => job,
-                Err(msg) => {
-                    append_job_log(&self.job_logger, job_id, JobLogLevel::Error, msg.clone());
-                    return Err(msg);
-                }
-            };
-            let mut job = job.lock().await;
-            job.frontier = frontiers;
-            Ok(())
-        }
-        .boxed()
-    }
-
-    fn next_iteration<'a>(
-        &'a self,
         readonly: bool,
-        job_id: JobId,
     ) -> BoxFuture<'a, Result<HashSet<Id>, String>> {
         async move {
             let job = match self
@@ -199,6 +178,14 @@ impl service::Service for service::HNSWPartitionService {
                     return Err(msg);
                 }
             };
+            // Set incoming frontiers if provided; otherwise preserve current frontier
+            {
+                let mut job = job.lock().await;
+                if !frontiers.is_empty() {
+                    job.frontier = frontiers;
+                }
+            }
+            // Now run next_iteration with the provided readonly flag
             let mut job = job.lock().await;
             let metric = Metric::from_encoding(job.metric);
             let logger = &self.job_logger;
@@ -240,6 +227,8 @@ impl service::Service for service::HNSWPartitionService {
         .boxed()
     }
 
+
+
     fn index_cell<'a>(&'a self, job_id: JobId, cell_id: Id) -> BoxFuture<'a, Result<(), String>> {
         async move {
             self.new_vertex(job_id, cell_id)
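
The merged RPC keeps both of the old call patterns: passing real frontiers replaces the former set_frontiers + next_iteration pair in a single round-trip, while passing an empty Vec means "advance with whatever frontier the job already holds", which is how the old parameterless next_iteration callers migrate. A toy single-process sketch of these semantics (the Job struct and its expansion rule are invented; the real service locks the job table entry and runs an HNSW search step):

use std::collections::HashSet;

// Hypothetical stand-in for the per-job search state held by a partition.
struct Job {
    frontier: Vec<u64>,
}

impl Job {
    // Combined step: install incoming frontiers if provided (otherwise keep
    // the current ones), then run one iteration and return remote frontiers.
    fn advance_iteration(&mut self, frontiers: Vec<u64>, readonly: bool) -> HashSet<u64> {
        if !frontiers.is_empty() {
            self.frontier = frontiers;
        }
        // Toy "iteration": expand each frontier vertex to id + 1 and stop.
        // A readonly pass would additionally skip any lazy repairs.
        let _ = readonly;
        let next: HashSet<u64> = self.frontier.iter().map(|id| id + 1).collect();
        self.frontier.clear();
        next
    }
}

fn main() {
    // Empty frontiers: behaves like the old parameterless next_iteration.
    let mut local = Job { frontier: vec![5] };
    let remote = local.advance_iteration(Vec::new(), false);
    // Non-empty frontiers: behaves like set_frontiers + next_iteration.
    let mut peer = Job { frontier: Vec::new() };
    let remote2 = peer.advance_iteration(remote.into_iter().collect(), false);
    println!("{:?}", remote2);
}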

src/apps/hnsw/partition/tests.rs

Lines changed: 6 additions & 6 deletions
@@ -235,8 +235,8 @@ impl TestEnvironment {
             )
             .await
             .map_err(|e| format!("Failed to create job: {:?}", e))?;
-            partition_svr
-                .next_iteration(false, job_id)
+            let _ = partition_svr
+                .advance_iteration(job_id, Vec::new(), false)
                 .await
                 .map_err(|e| format!("Failed to run job with next iteration: {:?}", e))?;
             partition_svr
@@ -246,7 +246,7 @@ impl TestEnvironment {
             // let mut search = partition.new_search(CELL_SCHEMA_ID, VECTOR_FIELD_ID, &vector, 1, MetricEncoding::L2)
             //     .await
             //     .map_err(|e| format!("Failed to create search: {:?}", e))?;
-            // partition.next_iteration(&mut search, L2Metric, logger, job_id).await.map_err(|e| format!("Failed to run search iteration: {:?}", e))?;
+            // (legacy) partition.next_iteration(&mut search, ...)
             // partition.new_vertex(job_id, cell_id, &vector, CELL_SCHEMA_ID, VECTOR_FIELD_ID, L2Metric, SearchMetadata::default(), 3, logger).await.map_err(|e| format!("Failed to create vertex: {:?}", e))?;
         }
         Ok(())
@@ -276,16 +276,16 @@ impl TestEnvironment {
         )
         .await
         .map_err(|e| format!("Failed to create job: {:?}", e))?;
-        partition
-            .next_iteration(false, job_id)
+        let _ = partition
+            .advance_iteration(job_id, Vec::new(), false)
             .await
             .map_err(|e| format!("Failed to run job with next iteration: {:?}", e))?;
         let results = partition
            .top_k(job_id, k as u32)
            .await
            .map_err(|e| format!("Failed to search: {:?}", e))?;
         let duration = start.elapsed();
-        println!("Search took {:?} microseconds", duration.as_micros());
+        println!("Search took {:?} ms", duration.as_millis());
         Ok(results)
     }
 
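
A small test tweak rides along: the elapsed-time report switches from microseconds to milliseconds. The measurement itself is the usual std::time::Instant pattern:

use std::time::Instant;

fn main() {
    let start = Instant::now();
    // ... run the search under test here ...
    let duration = start.elapsed();
    // as_millis() truncates to whole milliseconds; as_micros() is the finer unit
    println!("Search took {:?} ms", duration.as_millis());
}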
