From adaedd5556107277f7b733c2430e80195214649d Mon Sep 17 00:00:00 2001 From: Evan Mesterhazy Date: Sat, 2 Mar 2024 19:50:40 -0500 Subject: [PATCH] Add documentation to lib/src/index.rs and lib/src/default_index/ --- lib/src/default_index/composite.rs | 34 +++++++++++++-------- lib/src/default_index/mod.rs | 7 +++++ lib/src/index.rs | 48 ++++++++++++++++++++++++++---- 3 files changed, 70 insertions(+), 19 deletions(-) diff --git a/lib/src/default_index/composite.rs b/lib/src/default_index/composite.rs index a54482917..40ae4e85a 100644 --- a/lib/src/default_index/composite.rs +++ b/lib/src/default_index/composite.rs @@ -98,7 +98,13 @@ impl AsCompositeIndex for &mut T { } } -/// Reference wrapper that provides global access to nested index segments. +/// `CompositeIndex` provides an index of both commit IDs and change IDs. +/// +/// We refer to this as a composite index because it's a composite of multiple +/// nested index segments where each parent segment is roughly twice as large +/// its child. segment. This provides a good balance between read and write +/// performance. +// Reference wrapper that provides global access to nested index segments. #[derive(RefCastCustom)] #[repr(transparent)] pub struct CompositeIndex(DynIndexSegment); @@ -355,6 +361,8 @@ impl CompositeIndex { .map(|(i, _)| IndexPosition(u32::try_from(i).unwrap())) } + /// Returns the subset of positions in `candidate_positions` which refer to + /// entries that are heads in the repository. pub fn heads_pos( &self, mut candidate_positions: BTreeSet, @@ -475,7 +483,6 @@ impl Index for &CompositeIndex { .collect() } - /// Parents before children fn topo_order(&self, input: &mut dyn Iterator) -> Vec { let mut ids = input.cloned().collect_vec(); ids.sort_by_cached_key(|id| self.commit_id_to_pos(id).unwrap()); @@ -511,12 +518,12 @@ impl ChangeIdIndexImpl { } impl ChangeIdIndex for ChangeIdIndexImpl { - /// Resolves change id prefix among all ids, then filters out hidden - /// entries. - /// - /// If `SingleMatch` is returned, the commits including in the set are all - /// visible. `AmbiguousMatch` may be returned even if the prefix is unique - /// within the visible entries. + // Resolves change id prefix among all ids, then filters out hidden + // entries. + // + // If `SingleMatch` is returned, the commits including in the set are all + // visible. `AmbiguousMatch` may be returned even if the prefix is unique + // within the visible entries. fn resolve_prefix(&self, prefix: &HexPrefix) -> PrefixResolution> { let index = self.index.as_composite(); match index.resolve_change_id_prefix(prefix) { @@ -540,11 +547,12 @@ impl ChangeIdIndex for ChangeIdIndexImpl { } } - /// Calculates the shortest prefix length of the given `change_id` among all - /// ids including hidden entries. - /// - /// The returned length is usually a few digits longer than the minimum - /// length to disambiguate within the visible entries. + // Calculates the shortest prefix length of the given `change_id` among all + // IDs, including hidden entries. + // + // The returned length is usually a few digits longer than the minimum + // length necessary to disambiguate within the visible entries since hidden + // entries are also considered when determining the prefix length. fn shortest_unique_prefix_len(&self, change_id: &ChangeId) -> usize { self.index .as_composite() diff --git a/lib/src/default_index/mod.rs b/lib/src/default_index/mod.rs index c85e40430..6e52d99d1 100644 --- a/lib/src/default_index/mod.rs +++ b/lib/src/default_index/mod.rs @@ -12,6 +12,13 @@ // See the License for the specific language governing permissions and // limitations under the License. +//! An on-disk index of the commits in a repository. +//! +//! Implements an index of the commits in a repository that conforms to the +//! trains in the [index module](crate::index). The index is stored on local +//! disk and contains an entry for every commit in the repository. See +//! [`DefaultReadonlyIndex`] and [`DefaultMutableIndex`]. + #![allow(missing_docs)] mod composite; diff --git a/lib/src/index.rs b/lib/src/index.rs index 28dc6d9e4..cc00e9b8a 100644 --- a/lib/src/index.rs +++ b/lib/src/index.rs @@ -12,7 +12,7 @@ // See the License for the specific language governing permissions and // limitations under the License. -#![allow(missing_docs)] +//! Interfaces for indexes of the commits in a repository. use std::any::Any; use std::fmt::Debug; @@ -28,33 +28,42 @@ use crate::operation::Operation; use crate::revset::{ResolvedExpression, Revset, RevsetEvaluationError}; use crate::store::Store; -/// Error while reading index from the `IndexStore`. +/// Returned if an error occurs while reading an index from the [`IndexStore`]. #[derive(Debug, Error)] #[error(transparent)] pub struct IndexReadError(pub Box); -/// Error while writing index to the `IndexStore`. +/// Returned if an error occurs while writing an index to the [`IndexStore`]. #[derive(Debug, Error)] #[error(transparent)] pub struct IndexWriteError(pub Box); -/// Error to be returned if `Index::all_heads_for_gc()` is not supported by the +/// An error returned if `Index::all_heads_for_gc()` is not supported by the /// index backend. #[derive(Debug, Error)] #[error("Cannot collect all heads by index of this type")] pub struct AllHeadsForGcUnsupported; +/// Defines the interface for types that provide persistent storage for an +/// index. pub trait IndexStore: Send + Sync + Debug { + #[allow(missing_docs)] fn as_any(&self) -> &dyn Any; + /// Returns a name representing the type of index that the `IndexStore` is + /// compatible with. For example, the `IndexStore` for the default index + /// returns "default". fn name(&self) -> &str; + /// Returns the index at the specified operation. fn get_index_at_op( &self, op: &Operation, store: &Arc, ) -> Result, IndexReadError>; + /// Writes `index` to the index store and returns a read-only version of the + /// index. fn write_index( &self, index: Box, @@ -62,15 +71,32 @@ pub trait IndexStore: Send + Sync + Debug { ) -> Result, IndexWriteError>; } +/// Defines the interface for types that provide an index of the commits in a +/// repository by [`CommitId`]. pub trait Index: Send + Sync { + /// Returns the minimum prefix length to disambiguate `commit_id` from other + /// commits in the index. The length returned is the number of hexadecimal + /// digits in the minimum prefix. + /// + /// If the given `commit_id` doesn't exist, returns the minimum prefix + /// length which matches none of the commits in the index. fn shortest_unique_commit_id_prefix_len(&self, commit_id: &CommitId) -> usize; + /// Searches the index for commit IDs matching `prefix`. Returns a + /// [`PrefixResolution`] with a [`CommitId`] if the prefix matches a single + /// commit. fn resolve_commit_id_prefix(&self, prefix: &HexPrefix) -> PrefixResolution; + /// Returns true if `commit_id` is present in the index. fn has_id(&self, commit_id: &CommitId) -> bool; + /// Returns true if `ancestor_id` commit is an ancestor of the + /// `descendant_id` commit, or if `ancestor_id` equals `descendant_id`. fn is_ancestor(&self, ancestor_id: &CommitId, descendant_id: &CommitId) -> bool; + /// Returns the best common ancestor or ancestors of the commits in `set1` + /// and `set2`. A "best common ancestor" has no descendants that are also + /// common ancestors. fn common_ancestors(&self, set1: &[CommitId], set2: &[CommitId]) -> Vec; /// Heads among all indexed commits at the associated operation. @@ -85,11 +111,17 @@ pub trait Index: Send + Sync { &self, ) -> Result + '_>, AllHeadsForGcUnsupported>; + /// Returns the subset of commit IDs in `candidates` which are not ancestors + /// of other commits in `candidates`. If a commit id is duplicated in the + /// `candidates` list it will appear at most once in the output. fn heads(&self, candidates: &mut dyn Iterator) -> Vec; - /// Parents before children + /// Orders a list of commit IDs such that parent commits appear before any + /// of their children. Commit IDs in the `input` are not deduplicated. fn topo_order(&self, input: &mut dyn Iterator) -> Vec; + /// Resolves the revset `expression` against the index and corresponding + /// `store`. fn evaluate_revset<'index>( &'index self, expression: &ResolvedExpression, @@ -97,6 +129,7 @@ pub trait Index: Send + Sync { ) -> Result, RevsetEvaluationError>; } +#[allow(missing_docs)] pub trait ReadonlyIndex: Send + Sync { fn as_any(&self) -> &dyn Any; @@ -108,6 +141,7 @@ pub trait ReadonlyIndex: Send + Sync { fn start_modification(&self) -> Box; } +#[allow(missing_docs)] pub trait MutableIndex { fn as_any(&self) -> &dyn Any; @@ -125,6 +159,8 @@ pub trait MutableIndex { fn merge_in(&mut self, other: &dyn ReadonlyIndex); } +/// Defines the interface for types that provide an index of the commits in a +/// repository by [`ChangeId`]. pub trait ChangeIdIndex: Send + Sync { /// Resolve an unambiguous change ID prefix to the commit IDs in the index. /// @@ -134,7 +170,7 @@ pub trait ChangeIdIndex: Send + Sync { /// This function returns the shortest length of a prefix of `key` that /// disambiguates it from every other key in the index. /// - /// The length to be returned is a number of hexadecimal digits. + /// The length returned is a number of hexadecimal digits. /// /// This has some properties that we do not currently make much use of: ///