gix_odb/store_impls/dynamic/
load_index.rs

1use std::{
2    collections::{BTreeMap, VecDeque},
3    ffi::OsStr,
4    ops::Deref,
5    path::{Path, PathBuf},
6    sync::{
7        atomic::{AtomicU16, Ordering},
8        Arc,
9    },
10    time::SystemTime,
11};
12
13use crate::store::{handle, types, RefreshMode};
14
15pub(crate) struct Snapshot {
16    /// Indices ready for object lookup or contains checks, ordered usually by modification data, recent ones first.
17    pub(crate) indices: Vec<handle::IndexLookup>,
18    /// A set of loose objects dbs to search once packed objects weren't found.
19    pub(crate) loose_dbs: Arc<Vec<crate::loose::Store>>,
20    /// remember what this state represents and to compare to other states.
21    pub(crate) marker: types::SlotIndexMarker,
22}
23
24mod error {
25    use std::path::PathBuf;
26
27    use gix_pack::multi_index::PackIndex;
28
29    /// Returned by [`crate::at_opts()`]
30    #[derive(thiserror::Error, Debug)]
31    #[allow(missing_docs)]
32    pub enum Error {
33        #[error("The objects directory at '{0}' is not an accessible directory")]
34        Inaccessible(PathBuf),
35        #[error(transparent)]
36        Io(#[from] std::io::Error),
37        #[error(transparent)]
38        Alternate(#[from] crate::alternate::Error),
39        #[error("The slotmap turned out to be too small with {} entries, would need {} more", .current, .needed)]
40        InsufficientSlots { current: usize, needed: usize },
41        /// The problem here is that some logic assumes that more recent generations are higher than previous ones. If we would overflow,
42        /// we would break that invariant which can lead to the wrong object from being returned. It would probably be super rare, but…
43        /// let's not risk it.
44        #[error(
45            "Would have overflown amount of max possible generations of {}",
46            super::Generation::MAX
47        )]
48        GenerationOverflow,
49        #[error("Cannot numerically handle more than {limit} packs in a single multi-pack index, got {actual} in file {index_path:?}")]
50        TooManyPacksInMultiIndex {
51            actual: PackIndex,
52            limit: PackIndex,
53            index_path: PathBuf,
54        },
55    }
56}
57
58pub use error::Error;
59
60use crate::store::types::{Generation, IndexAndPacks, MutableIndexAndPack, PackId, SlotMapIndex};
61
62impl super::Store {
63    /// Load all indices, refreshing from disk only if needed.
64    pub(crate) fn load_all_indices(&self) -> Result<Snapshot, Error> {
65        let mut snapshot = self.collect_snapshot();
66        while let Some(new_snapshot) = self.load_one_index(RefreshMode::Never, snapshot.marker)? {
67            snapshot = new_snapshot;
68        }
69        Ok(snapshot)
70    }
71
72    /// If `None` is returned, there is new indices and the caller should give up. This is a possibility even if it's allowed to refresh
73    /// as here might be no change to pick up.
74    pub(crate) fn load_one_index(
75        &self,
76        refresh_mode: RefreshMode,
77        marker: types::SlotIndexMarker,
78    ) -> Result<Option<Snapshot>, Error> {
79        let index = self.index.load();
80        if !index.is_initialized() {
81            return self.consolidate_with_disk_state(true /* needs_init */, false /*load one new index*/);
82        }
83
84        if marker.generation != index.generation || marker.state_id != index.state_id() {
85            // We have a more recent state already, provide it.
86            Ok(Some(self.collect_snapshot()))
87        } else {
88            // always compare to the latest state
89            // Nothing changed in the meantime, try to load another index…
90            if self.load_next_index(index) {
91                Ok(Some(self.collect_snapshot()))
92            } else {
93                // …and if that didn't yield anything new consider refreshing our disk state.
94                match refresh_mode {
95                    RefreshMode::Never => Ok(None),
96                    RefreshMode::AfterAllIndicesLoaded => {
97                        self.consolidate_with_disk_state(false /* needs init */, true /*load one new index*/)
98                    }
99                }
100            }
101        }
102    }
103
104    /// load a new index (if not yet loaded), and return true if one was indeed loaded (leading to a `state_id()` change) of the current index.
105    /// Note that interacting with the slot-map is inherently racy and we have to deal with it, being conservative in what we even try to load
106    /// as our index might already be out-of-date as we try to use it to learn what's next.
107    fn load_next_index(&self, mut index: arc_swap::Guard<Arc<SlotMapIndex>>) -> bool {
108        'retry_with_changed_index: loop {
109            let previous_state_id = index.state_id();
110            'retry_with_next_slot_index: loop {
111                match index
112                    .next_index_to_load
113                    .fetch_update(Ordering::SeqCst, Ordering::SeqCst, |current| {
114                        (current != index.slot_indices.len()).then_some(current + 1)
115                    }) {
116                    Ok(slot_map_index) => {
117                        // This slot-map index is in bounds and was only given to us.
118                        let _ongoing_operation = IncOnNewAndDecOnDrop::new(&index.num_indices_currently_being_loaded);
119                        let slot = &self.files[index.slot_indices[slot_map_index]];
120                        let _lock = slot.write.lock();
121                        if slot.generation.load(Ordering::SeqCst) > index.generation {
122                            // There is a disk consolidation in progress which just overwrote a slot that could be disposed with some other
123                            // index, one we didn't intend to load.
124                            // Continue with the next slot index in the hope there is something else we can do…
125                            continue 'retry_with_next_slot_index;
126                        }
127                        let mut bundle = slot.files.load_full();
128                        let bundle_mut = Arc::make_mut(&mut bundle);
129                        if let Some(files) = bundle_mut.as_mut() {
130                            // these are always expected to be set, unless somebody raced us. We handle this later by retrying.
131                            let res = {
132                                let res = files.load_index(self.object_hash);
133                                slot.files.store(bundle);
134                                index.loaded_indices.fetch_add(1, Ordering::SeqCst);
135                                res
136                            };
137                            match res {
138                                Ok(_) => {
139                                    break 'retry_with_next_slot_index;
140                                }
141                                Err(_err) => {
142                                    gix_features::trace::error!(err=?_err, "Failed to load index file - some objects may seem to not exist");
143                                    continue 'retry_with_next_slot_index;
144                                }
145                            }
146                        }
147                    }
148                    Err(_nothing_more_to_load) => {
149                        // There can be contention as many threads start working at the same time and take all the
150                        // slots to load indices for. Some threads might just be left-over and have to wait for something
151                        // to change.
152                        // TODO: potentially hot loop - could this be a condition variable?
153                        // This is a timing-based fix for the case that the `num_indices_being_loaded` isn't yet incremented,
154                        // and we might break out here without actually waiting for the loading operation. Then we'd fail to
155                        // observe a change and the underlying handler would not have all the indices it needs at its disposal.
156                        // Yielding means we will definitely loose enough time to observe the ongoing operation,
157                        // or its effects.
158                        std::thread::yield_now();
159                        while index.num_indices_currently_being_loaded.load(Ordering::SeqCst) != 0 {
160                            std::thread::yield_now();
161                        }
162                        break 'retry_with_next_slot_index;
163                    }
164                }
165            }
166            if previous_state_id == index.state_id() {
167                let potentially_new_index = self.index.load();
168                if Arc::as_ptr(&potentially_new_index) == Arc::as_ptr(&index) {
169                    // There isn't a new index with which to retry the whole ordeal, so nothing could be done here.
170                    return false;
171                } else {
172                    // the index changed, worth trying again
173                    index = potentially_new_index;
174                    continue 'retry_with_changed_index;
175                }
176            } else {
177                // something inarguably changed, probably an index was loaded. 'probably' because we consider failed loads valid attempts,
178                // even they don't change anything for the caller which would then do a round for nothing.
179                return true;
180            }
181        }
182    }
183
184    /// refresh and possibly clear out our existing data structures, causing all pack ids to be invalidated.
185    /// `load_new_index` is an optimization to at least provide one newly loaded pack after refreshing the slot map.
186    pub(crate) fn consolidate_with_disk_state(
187        &self,
188        needs_init: bool,
189        load_new_index: bool,
190    ) -> Result<Option<Snapshot>, Error> {
191        let index = self.index.load();
192        let previous_index_state = Arc::as_ptr(&index) as usize;
193
194        // IMPORTANT: get a lock after we recorded the previous state.
195        let write = self.write.lock();
196        let objects_directory = &self.path;
197
198        // Now we know the index isn't going to change anymore, even though threads might still load indices in the meantime.
199        let index = self.index.load();
200        if previous_index_state != Arc::as_ptr(&index) as usize {
201            // Someone else took the look before and changed the index. Return it without doing any additional work.
202            return Ok(Some(self.collect_snapshot()));
203        }
204
205        let was_uninitialized = !index.is_initialized();
206
207        // We might not be able to detect by pointer if the state changed, as this itself is racy. So we keep track of double-initialization
208        // using a flag, which means that if `needs_init` was true we saw the index uninitialized once, but now that we are here it's
209        // initialized meaning that somebody was faster, and we couldn't detect it by comparisons to the index.
210        // If so, make sure we collect the snapshot instead of returning None in case nothing actually changed, which is likely with a
211        // race like this.
212        if !was_uninitialized && needs_init {
213            return Ok(Some(self.collect_snapshot()));
214        }
215        self.num_disk_state_consolidation.fetch_add(1, Ordering::Relaxed);
216
217        let db_paths: Vec<_> = std::iter::once(objects_directory.to_owned())
218            .chain(crate::alternate::resolve(objects_directory.clone(), &self.current_dir)?)
219            .collect();
220
221        // turn db paths into loose object databases. Reuse what's there, but only if it is in the right order.
222        let loose_dbs = if was_uninitialized
223            || db_paths.len() != index.loose_dbs.len()
224            || db_paths
225                .iter()
226                .zip(index.loose_dbs.iter().map(|ldb| &ldb.path))
227                .any(|(lhs, rhs)| lhs != rhs)
228        {
229            Arc::new(
230                db_paths
231                    .iter()
232                    .map(|path| crate::loose::Store::at(path, self.object_hash))
233                    .collect::<Vec<_>>(),
234            )
235        } else {
236            Arc::clone(&index.loose_dbs)
237        };
238
239        let indices_by_modification_time = Self::collect_indices_and_mtime_sorted_by_size(
240            db_paths,
241            index.slot_indices.len().into(),
242            self.use_multi_pack_index.then_some(self.object_hash),
243        )?;
244        let mut idx_by_index_path: BTreeMap<_, _> = index
245            .slot_indices
246            .iter()
247            .filter_map(|&idx| {
248                let f = &self.files[idx];
249                Option::as_ref(&f.files.load()).map(|f| (f.index_path().to_owned(), idx))
250            })
251            .collect();
252
253        let mut new_slot_map_indices = Vec::new(); // these indices into the slot map still exist there/didn't change
254        let mut index_paths_to_add = was_uninitialized
255            .then(|| VecDeque::with_capacity(indices_by_modification_time.len()))
256            .unwrap_or_default();
257
258        // Figure out this number based on what we see while handling the existing indices
259        let mut num_loaded_indices = 0;
260        for (index_info, mtime) in indices_by_modification_time.into_iter().map(|(a, b, _)| (a, b)) {
261            match idx_by_index_path.remove(index_info.path()) {
262                Some(slot_idx) => {
263                    let slot = &self.files[slot_idx];
264                    let files_guard = slot.files.load();
265                    let files =
266                        Option::as_ref(&files_guard).expect("slot is set or we wouldn't know it points to this file");
267                    if index_info.is_multi_index() && files.mtime() != mtime {
268                        // we have a changed multi-pack index. We can't just change the existing slot as it may alter slot indices
269                        // that are currently available. Instead, we have to move what's there into a new slot, along with the changes,
270                        // and later free the slot or dispose of the index in the slot (like we do for removed/missing files).
271                        index_paths_to_add.push_back((index_info, mtime, Some(slot_idx)));
272                        // If the current slot is loaded, the soon-to-be copied multi-index path will be loaded as well.
273                        if files.index_is_loaded() {
274                            num_loaded_indices += 1;
275                        }
276                    } else {
277                        // packs and indices are immutable, so no need to check modification times. Unchanged multi-pack indices also
278                        // are handled like this just to be sure they are in the desired state. For these, the only way this could happen
279                        // is if somebody deletes and then puts back
280                        if Self::assure_slot_matches_index(&write, slot, index_info, mtime, index.generation) {
281                            num_loaded_indices += 1;
282                        }
283                        new_slot_map_indices.push(slot_idx);
284                    }
285                }
286                None => index_paths_to_add.push_back((index_info, mtime, None)),
287            }
288        }
289        let needs_stable_indices = self.maintain_stable_indices(&write);
290
291        let mut next_possibly_free_index = index
292            .slot_indices
293            .iter()
294            .max()
295            .map_or(0, |idx| (idx + 1) % self.files.len());
296        let mut num_indices_checked = 0;
297        let mut needs_generation_change = false;
298        let mut slot_indices_to_remove: Vec<_> = idx_by_index_path.into_values().collect();
299        while let Some((mut index_info, mtime, move_from_slot_idx)) = index_paths_to_add.pop_front() {
300            'increment_slot_index: loop {
301                if num_indices_checked == self.files.len() {
302                    return Err(Error::InsufficientSlots {
303                        current: self.files.len(),
304                        needed: index_paths_to_add.len() + 1, /*the one currently popped off*/
305                    });
306                }
307                // Don't allow duplicate indicates, we need a 1:1 mapping.
308                if new_slot_map_indices.contains(&next_possibly_free_index) {
309                    next_possibly_free_index = (next_possibly_free_index + 1) % self.files.len();
310                    num_indices_checked += 1;
311                    continue 'increment_slot_index;
312                }
313                let slot_index = next_possibly_free_index;
314                let slot = &self.files[slot_index];
315                next_possibly_free_index = (next_possibly_free_index + 1) % self.files.len();
316                num_indices_checked += 1;
317                match move_from_slot_idx {
318                    Some(move_from_slot_idx) => {
319                        debug_assert!(index_info.is_multi_index(), "only set for multi-pack indices");
320                        if slot_index == move_from_slot_idx {
321                            // don't try to move onto ourselves
322                            continue 'increment_slot_index;
323                        }
324                        match Self::try_set_index_slot(
325                            &write,
326                            slot,
327                            index_info,
328                            mtime,
329                            index.generation,
330                            needs_stable_indices,
331                        ) {
332                            Ok(dest_was_empty) => {
333                                slot_indices_to_remove.push(move_from_slot_idx);
334                                new_slot_map_indices.push(slot_index);
335                                // To avoid handling out the wrong pack (due to reassigned pack ids), declare this a new generation.
336                                if !dest_was_empty {
337                                    needs_generation_change = true;
338                                }
339                                break 'increment_slot_index;
340                            }
341                            Err(unused_index_info) => index_info = unused_index_info,
342                        }
343                    }
344                    None => {
345                        match Self::try_set_index_slot(
346                            &write,
347                            slot,
348                            index_info,
349                            mtime,
350                            index.generation,
351                            needs_stable_indices,
352                        ) {
353                            Ok(dest_was_empty) => {
354                                new_slot_map_indices.push(slot_index);
355                                if !dest_was_empty {
356                                    needs_generation_change = true;
357                                }
358                                break 'increment_slot_index;
359                            }
360                            Err(unused_index_info) => index_info = unused_index_info,
361                        }
362                    }
363                }
364                // This isn't racy as it's only us who can change the Option::Some/None state of a slot.
365            }
366        }
367        assert_eq!(
368            index_paths_to_add.len(),
369            0,
370            "By this time we have assigned all new files to slots"
371        );
372
373        let generation = if needs_generation_change {
374            index.generation.checked_add(1).ok_or(Error::GenerationOverflow)?
375        } else {
376            index.generation
377        };
378        let index_unchanged = index.slot_indices == new_slot_map_indices;
379        if generation != index.generation {
380            assert!(
381                !index_unchanged,
382                "if the generation changed, the slot index must have changed for sure"
383            );
384        }
385        if !index_unchanged || loose_dbs != index.loose_dbs {
386            let new_index = Arc::new(SlotMapIndex {
387                slot_indices: new_slot_map_indices,
388                loose_dbs,
389                generation,
390                // if there was a prior generation, some indices might already be loaded. But we deal with it by trying to load the next index then,
391                // until we find one.
392                next_index_to_load: index_unchanged
393                    .then(|| Arc::clone(&index.next_index_to_load))
394                    .unwrap_or_default(),
395                loaded_indices: index_unchanged
396                    .then(|| Arc::clone(&index.loaded_indices))
397                    .unwrap_or_else(|| Arc::new(num_loaded_indices.into())),
398                num_indices_currently_being_loaded: Default::default(),
399            });
400            self.index.store(new_index);
401        }
402
403        // deleted items - remove their slots AFTER we have set the new index if we may alter indices, otherwise we only declare them garbage.
404        // removing slots may cause pack loading to fail, and they will then reload their indices.
405        for slot in slot_indices_to_remove.into_iter().map(|idx| &self.files[idx]) {
406            let _lock = slot.write.lock();
407            let mut files = slot.files.load_full();
408            let files_mut = Arc::make_mut(&mut files);
409            if needs_stable_indices {
410                if let Some(files) = files_mut.as_mut() {
411                    files.trash();
412                    // generation stays the same, as it's the same value still but scheduled for eventual removal.
413                }
414            } else {
415                // set the generation before we actually change the value, otherwise readers of old generations could observe the new one.
416                // We rather want them to turn around here and update their index, which, by that time, might actually already be available.
417                // If not, they would fail unable to load a pack or index they need, but that's preferred over returning wrong objects.
418                // Safety: can't race as we hold the lock, have to set the generation beforehand to help avoid others to observe the value.
419                slot.generation.store(generation, Ordering::SeqCst);
420                *files_mut = None;
421            };
422            slot.files.store(files);
423        }
424
425        let new_index = self.index.load();
426        Ok(if index.state_id() == new_index.state_id() {
427            // there was no change, and nothing was loaded in the meantime, reflect that in the return value to not get into loops.
428            None
429        } else {
430            if load_new_index {
431                self.load_next_index(new_index);
432            }
433            Some(self.collect_snapshot())
434        })
435    }
436
437    pub(crate) fn collect_indices_and_mtime_sorted_by_size(
438        db_paths: Vec<PathBuf>,
439        initial_capacity: Option<usize>,
440        multi_pack_index_object_hash: Option<gix_hash::Kind>,
441    ) -> Result<Vec<(Either, SystemTime, u64)>, Error> {
442        let mut indices_by_modification_time = Vec::with_capacity(initial_capacity.unwrap_or_default());
443        for db_path in db_paths {
444            let packs = db_path.join("pack");
445            let entries = match std::fs::read_dir(packs) {
446                Ok(e) => e,
447                Err(err) if err.kind() == std::io::ErrorKind::NotFound => continue,
448                Err(err) => return Err(err.into()),
449            };
450            let indices = entries
451                .filter_map(Result::ok)
452                .filter_map(|e| e.metadata().map(|md| (e.path(), md)).ok())
453                .filter(|(_, md)| md.file_type().is_file())
454                .filter(|(p, _)| {
455                    let ext = p.extension();
456                    (ext == Some(OsStr::new("idx")) && p.with_extension("pack").is_file())
457                        || (multi_pack_index_object_hash.is_some() && ext.is_none() && is_multipack_index(p))
458                })
459                .map(|(p, md)| md.modified().map_err(Error::from).map(|mtime| (p, mtime, md.len())))
460                .collect::<Result<Vec<_>, _>>()?;
461
462            let multi_index_info = multi_pack_index_object_hash
463                .and_then(|hash| {
464                    indices.iter().find_map(|(p, a, b)| {
465                        is_multipack_index(p)
466                            .then(|| {
467                                // we always open the multi-pack here to be able to remove indices
468                                gix_pack::multi_index::File::at(p)
469                                    .ok()
470                                    .filter(|midx| midx.object_hash() == hash)
471                                    .map(|midx| (midx, *a, *b))
472                            })
473                            .flatten()
474                            .map(|t| {
475                                if t.0.num_indices() > PackId::max_packs_in_multi_index() {
476                                    Err(Error::TooManyPacksInMultiIndex {
477                                        index_path: p.to_owned(),
478                                        actual: t.0.num_indices(),
479                                        limit: PackId::max_packs_in_multi_index(),
480                                    })
481                                } else {
482                                    Ok(t)
483                                }
484                            })
485                    })
486                })
487                .transpose()?;
488            if let Some((multi_index, mtime, flen)) = multi_index_info {
489                let index_names_in_multi_index: Vec<_> = multi_index.index_names().iter().map(AsRef::as_ref).collect();
490                let mut indices_not_in_multi_index: Vec<(Either, _, _)> = indices
491                    .into_iter()
492                    .filter_map(|(path, a, b)| {
493                        (path != multi_index.path()
494                            && !index_names_in_multi_index
495                                .contains(&Path::new(path.file_name().expect("file name present"))))
496                        .then_some((Either::IndexPath(path), a, b))
497                    })
498                    .collect();
499                indices_not_in_multi_index.insert(0, (Either::MultiIndexFile(Arc::new(multi_index)), mtime, flen));
500                indices_by_modification_time.extend(indices_not_in_multi_index);
501            } else {
502                indices_by_modification_time.extend(
503                    indices
504                        .into_iter()
505                        .filter_map(|(p, a, b)| (!is_multipack_index(&p)).then_some((Either::IndexPath(p), a, b))),
506                );
507            }
508        }
509        // Unlike libgit2, do not sort by modification date, but by size and put the biggest indices first. That way
510        // the chance to hit an object should be higher. We leave it to the handle to sort by LRU.
511        // Git itself doesn't change the order which may save time, but we want it to be stable which also helps some tests.
512        // NOTE: this will work well for well-packed repos or those using geometric repacking, but force us to open a lot
513        //       of files when dealing with new objects, as there is no notion of recency here as would be with unmaintained
514        //       repositories. Different algorithms should be provided, like newest packs first, and possibly a mix of both
515        //       with big packs first, then sorting by recency for smaller packs.
516        //       We also want to implement `fetch.unpackLimit` to alleviate this issue a little.
517        indices_by_modification_time.sort_by(|l, r| l.2.cmp(&r.2).reverse());
518        Ok(indices_by_modification_time)
519    }
520
521    /// returns `Ok(dest_slot_was_empty)` if the copy could happen because dest-slot was actually free or disposable.
522    #[allow(clippy::too_many_arguments)]
523    fn try_set_index_slot(
524        lock: &parking_lot::MutexGuard<'_, ()>,
525        dest_slot: &MutableIndexAndPack,
526        index_info: Either,
527        mtime: SystemTime,
528        current_generation: Generation,
529        needs_stable_indices: bool,
530    ) -> Result<bool, Either> {
531        let (dest_slot_was_empty, generation) = match &**dest_slot.files.load() {
532            Some(bundle) => {
533                if bundle.index_path() == index_info.path() || (bundle.is_disposable() && needs_stable_indices) {
534                    // it might be possible to see ourselves in case all slots are taken, but there are still a few more destination
535                    // slots to look for.
536                    return Err(index_info);
537                }
538                // Since we overwrite an existing slot, we have to increment the generation to prevent anyone from trying to use it while
539                // before we are replacing it with a different value.
540                // In detail:
541                // We need to declare this to be the future to avoid anything in that slot to be returned to people who
542                // last saw the old state. They will then try to get a new index which by that time, might be happening
543                // in time so they get the latest one. If not, they will probably get into the same situation again until
544                // it finally succeeds. Alternatively, the object will be reported unobtainable, but at least it won't return
545                // some other object.
546                (false, current_generation + 1)
547            }
548            None => {
549                // For multi-pack indices:
550                //   Do NOT copy the packs over, they need to be reopened to get the correct pack id matching the new slot map index.
551                //   If we are allowed to delete the original, and nobody has the pack referenced, it is closed which is preferred.
552                //   Thus we simply always start new with packs in multi-pack indices.
553                //   In the worst case this could mean duplicate file handle usage though as the old and the new index can't share
554                //   packs due to the intrinsic id.
555                //   Note that the ID is used for cache access, too, so it must be unique. It must also be mappable from pack-id to slotmap id.
556                (true, current_generation)
557            }
558        };
559        Self::set_slot_to_index(lock, dest_slot, index_info, mtime, generation);
560        Ok(dest_slot_was_empty)
561    }
562
563    fn set_slot_to_index(
564        _lock: &parking_lot::MutexGuard<'_, ()>,
565        slot: &MutableIndexAndPack,
566        index_info: Either,
567        mtime: SystemTime,
568        generation: Generation,
569    ) {
570        let _lock = slot.write.lock();
571        let mut files = slot.files.load_full();
572        let files_mut = Arc::make_mut(&mut files);
573        // set the generation before we actually change the value, otherwise readers of old generations could observe the new one.
574        // We rather want them to turn around here and update their index, which, by that time, might actually already be available.
575        // If not, they would fail unable to load a pack or index they need, but that's preferred over returning wrong objects.
576        // Safety: can't race as we hold the lock, have to set the generation beforehand to help avoid others to observe the value.
577        slot.generation.store(generation, Ordering::SeqCst);
578        *files_mut = Some(index_info.into_index_and_packs(mtime));
579        slot.files.store(files);
580    }
581
582    /// Returns true if the index was left in a loaded state.
583    fn assure_slot_matches_index(
584        _lock: &parking_lot::MutexGuard<'_, ()>,
585        slot: &MutableIndexAndPack,
586        index_info: Either,
587        mtime: SystemTime,
588        current_generation: Generation,
589    ) -> bool {
590        match Option::as_ref(&slot.files.load()) {
591            Some(bundle) => {
592                assert_eq!(
593                    bundle.index_path(),
594                    index_info.path(),
595                    "Parallel writers cannot change the file the slot points to."
596                );
597                if bundle.is_disposable() {
598                    // put it into the correct mode, it's now available for sure so should not be missing or garbage.
599                    // The latter can happen if files are removed and put back for some reason, but we should definitely
600                    // have them in a decent state now that we know/think they are there.
601                    let _lock = slot.write.lock();
602                    let mut files = slot.files.load_full();
603                    let files_mut = Arc::make_mut(&mut files)
604                        .as_mut()
605                        .expect("BUG: cannot change from something to nothing, would be race");
606                    files_mut.put_back();
607                    debug_assert_eq!(
608                        files_mut.mtime(),
609                        mtime,
610                        "BUG: we can only put back files that didn't obviously change"
611                    );
612                    // Safety: can't race as we hold the lock, must be set before replacing the data.
613                    // NOTE that we don't change the generation as it's still the very same index we talk about, it doesn't change
614                    // identity.
615                    slot.generation.store(current_generation, Ordering::SeqCst);
616                    slot.files.store(files);
617                } else {
618                    // it's already in the correct state, either loaded or unloaded.
619                }
620                bundle.index_is_loaded()
621            }
622            None => {
623                unreachable!("BUG: a slot can never be deleted if we have it recorded in the index WHILE changing said index. There shouldn't be a race")
624            }
625        }
626    }
627
628    /// Stability means that indices returned by this API will remain valid.
629    /// Without that constraint, we may unload unused packs and indices, and may rebuild the slotmap index.
630    ///
631    /// Note that this must be called with a lock to the relevant state held to assure these values don't change while
632    /// we are working on said index.
633    fn maintain_stable_indices(&self, _guard: &parking_lot::MutexGuard<'_, ()>) -> bool {
634        self.num_handles_stable.load(Ordering::SeqCst) > 0
635    }
636
637    pub(crate) fn collect_snapshot(&self) -> Snapshot {
638        // We don't observe changes-on-disk in our 'wait-for-load' loop.
639        // That loop is meant to help assure the marker (which includes the amount of loaded indices) matches
640        // the actual amount of indices we collect.
641        let index = self.index.load();
642        loop {
643            if index.num_indices_currently_being_loaded.deref().load(Ordering::SeqCst) != 0 {
644                std::thread::yield_now();
645                continue;
646            }
647            let marker = index.marker();
648            let indices = if index.is_initialized() {
649                index
650                    .slot_indices
651                    .iter()
652                    .map(|idx| (*idx, &self.files[*idx]))
653                    .filter_map(|(id, file)| {
654                        let lookup = match (**file.files.load()).as_ref()? {
655                            types::IndexAndPacks::Index(bundle) => handle::SingleOrMultiIndex::Single {
656                                index: bundle.index.loaded()?.clone(),
657                                data: bundle.data.loaded().cloned(),
658                            },
659                            types::IndexAndPacks::MultiIndex(multi) => handle::SingleOrMultiIndex::Multi {
660                                index: multi.multi_index.loaded()?.clone(),
661                                data: multi.data.iter().map(|f| f.loaded().cloned()).collect(),
662                            },
663                        };
664                        handle::IndexLookup { file: lookup, id }.into()
665                    })
666                    .collect()
667            } else {
668                Vec::new()
669            };
670
671            return Snapshot {
672                indices,
673                loose_dbs: Arc::clone(&index.loose_dbs),
674                marker,
675            };
676        }
677    }
678}
679
680// Outside of this method we will never assign new slot indices.
681fn is_multipack_index(path: &Path) -> bool {
682    path.file_name() == Some(OsStr::new("multi-pack-index"))
683}
684
685struct IncOnNewAndDecOnDrop<'a>(&'a AtomicU16);
686impl<'a> IncOnNewAndDecOnDrop<'a> {
687    pub fn new(v: &'a AtomicU16) -> Self {
688        v.fetch_add(1, Ordering::SeqCst);
689        Self(v)
690    }
691}
692impl Drop for IncOnNewAndDecOnDrop<'_> {
693    fn drop(&mut self) {
694        self.0.fetch_sub(1, Ordering::SeqCst);
695    }
696}
697
698pub(crate) enum Either {
699    IndexPath(PathBuf),
700    MultiIndexFile(Arc<gix_pack::multi_index::File>),
701}
702
703impl Either {
704    fn path(&self) -> &Path {
705        match self {
706            Either::IndexPath(p) => p,
707            Either::MultiIndexFile(f) => f.path(),
708        }
709    }
710
711    fn into_index_and_packs(self, mtime: SystemTime) -> IndexAndPacks {
712        match self {
713            Either::IndexPath(path) => IndexAndPacks::new_single(path, mtime),
714            Either::MultiIndexFile(file) => IndexAndPacks::new_multi_from_open_file(file, mtime),
715        }
716    }
717
718    fn is_multi_index(&self) -> bool {
719        matches!(self, Either::MultiIndexFile(_))
720    }
721}
722
723impl Eq for Either {}
724
725impl PartialEq<Self> for Either {
726    fn eq(&self, other: &Self) -> bool {
727        self.path().eq(other.path())
728    }
729}
730
731impl PartialOrd<Self> for Either {
732    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
733        Some(self.path().cmp(other.path()))
734    }
735}
736
737impl Ord for Either {
738    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
739        self.path().cmp(other.path())
740    }
741}