1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
/*
 * Copyright (C) 2023  The Software Heritage developers
 * See the AUTHORS file at the top-level directory of this distribution
 * License: GNU General Public License version 3, or any later version
 * See top-level LICENSE file for more information
 */

use std::path::{Path, PathBuf};

use anyhow::{anyhow, Context, Result};

use crate::SWHType;

#[cfg(feature = "dataset-writer")]
pub mod dataset_writer;
pub mod mmap;
pub mod shuffle;
pub mod sort;

pub fn dir_size(path: &Path) -> Result<usize> {
    Ok(std::fs::read_dir(path)
        .with_context(|| format!("Could not list {}", path.display()))?
        .map(|entry| {
            entry
                .unwrap_or_else(|e| panic!("Could not read {} entry: {:?}", path.display(), e))
                .metadata()
                .as_ref()
                .unwrap_or_else(|e| panic!("Could not read {} entry: {:?}", path.display(), e))
                .len() as usize
        })
        .sum::<usize>())
}

/// Appends a string to a path
///
/// ```
/// # use std::path::{Path, PathBuf};
/// # use swh_graph::utils::suffix_path;
///
/// assert_eq!(
///     suffix_path(Path::new("/tmp/graph"), "-transposed"),
///     Path::new("/tmp/graph-transposed").to_owned()
/// );
/// ```
#[inline(always)]
pub fn suffix_path<P: AsRef<Path>, S: AsRef<std::ffi::OsStr>>(path: P, suffix: S) -> PathBuf {
    let mut path = path.as_ref().as_os_str().to_owned();
    path.push(suffix);
    path.into()
}

/// Given a string like `*` or `cnt,dir,rev,rel,snp,ori`, returns a list of `SWHType`
/// matching the string.
pub fn parse_allowed_node_types(s: &str) -> Result<Vec<SWHType>> {
    if s == "*" {
        Ok(SWHType::all())
    } else {
        let mut types = Vec::new();
        for type_ in s.split(',') {
            types.push(
                type_
                    .try_into()
                    .map_err(|s| anyhow!("Could not parse --allowed-node-types {s}"))?,
            );
        }
        Ok(types)
    }
}

#[allow(clippy::len_without_is_empty)]
pub trait GetIndex {
    type Output;

    /// Returns the total number of items in the collections
    fn len(&self) -> usize;

    /// Returns an item of the collection
    fn get(&self, index: usize) -> Option<Self::Output>;

    /// Returns an item of the collection
    ///
    /// # Safety
    ///
    /// Undefined behavior if the index is past the end of the collection.
    unsafe fn get_unchecked(&self, index: usize) -> Self::Output;
}

impl<Item: Clone, T: std::ops::Deref<Target = [Item]>> GetIndex for T {
    type Output = Item;

    fn len(&self) -> usize {
        <[Item]>::len(self)
    }

    fn get(&self, index: usize) -> Option<Self::Output> {
        <[Item]>::get(self, index).cloned()
    }

    unsafe fn get_unchecked(&self, index: usize) -> Self::Output {
        <[Item]>::get_unchecked(self, index).clone()
    }
}