summaryrefslogtreecommitdiffstats
path: root/src/repository/fs.rs
blob: 435e2be39473e2bdf78e0c424475a35244569a91 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
use std::ops::Deref;
use std::path::Path;
use std::sync::Arc;

use anyhow::Error;
use anyhow::Result;
use tokio_stream::Stream;


/// Helper type to limit access to the filesystem in massive-parallel cases where we would run into
/// system error 24 ("too many open files").
#[derive(Clone)]
pub struct FileSystemAccessor {
    sem: Arc<tokio::sync::Semaphore>,
}

impl FileSystemAccessor {
    pub fn new(limit: usize) -> Self {
        FileSystemAccessor { sem: Arc::new(tokio::sync::Semaphore::new(limit)) }
    }

    #[inline]
    pub fn available_permits(&self) -> usize {
        self.sem.available_permits()
    }

    pub async fn read_dir(&self, path: impl AsRef<Path>) -> Result<impl Stream<Item = Result<DirEntry>>> {
        log::trace!("Accessor::read_dir({}): Acquiring Semaphore: {} - 1", path.as_ref().display(), self.available_permits());
        let perm = self.sem.acquire().await?;
        let sema = self.sem.clone();
        let mut read_dir = tokio::fs::read_dir(&path).await?;

        let stream = async_stream::stream! {
            loop {
                log::trace!("Accessor::read_dir(_): Acquiring Semaphore: {} - 1", sema.available_permits());
                let permit = sema.clone().acquire_owned().await?;
                if let Some(entry) = read_dir.next_entry().await? {
                    let dentry = DirEntry { permit, entry };
                    yield Ok(dentry) as Result<_>;
                } else {
                    break;
                }
            }
        };

        log::trace!("Accessor::read_dir({}): Dropping Semaphore: {} + 1", path.as_ref().display(), self.available_permits());
        drop(perm);
        Ok(stream)
    }

    pub async fn exists(&self, p: impl AsRef<Path>) -> Result<bool> {
        log::trace!("Accessor::exists({}): Acquiring Semaphore: {} - 1", p.as_ref().display(), self.available_permits());
        let perm = self.sem.acquire().await?;
        let r = p.as_ref().exists();
        log::trace!("Accessor::exists({}): Dropping Semaphore: {} + 1", p.as_ref().display(), self.available_permits());
        drop(perm);
        Ok(r)
    }

    pub async fn is_file(&self, p: impl AsRef<Path>) -> Result<bool> {
        log::trace!("Accessor::is_file({}): Acquiring Semaphore: {} - 1", p.as_ref().display(), self.available_permits());
        let perm = self.sem.acquire().await?;
        let r = p.as_ref().is_file();
        log::trace!("Accessor::is_file({}): Dropping Semaphore: {} + 1", p.as_ref().display(), self.available_permits());
        drop(perm);
        Ok(r)
    }

    pub async fn read_to_string(&self, p: impl AsRef<Path>) -> Result<String> {
        log::trace!("Accessor::read_to_string({}): Acquiring Semaphore: {} - 1", p.as_ref().display(), self.available_permits());
        let perm = self.sem.acquire().await?;
        let r = tokio::fs::read_to_string(&p).await.map_err(Error::from);
        log::trace!("Accessor::read_to_string({}): Dropping Semaphore: {} + 1", p.as_ref().display(), self.available_permits());
        drop(perm);
        r
    }
}

#[derive(Debug)]
pub struct DirEntry {
    permit: tokio::sync::OwnedSemaphorePermit,
    entry: tokio::fs::DirEntry,
}


impl Deref for DirEntry {
    type Target = tokio::fs::DirEntry;

    fn deref(&self) -> &Self::Target {
        &self.entry
    }
}