summaryrefslogtreecommitdiff
path: root/src/chunker.rs
blob: f424833b81fc129811ed20573209b585778928c2 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
use crate::checksummer::sha256;
use crate::chunk::DataChunk;
use crate::chunkmeta::ChunkMeta;
use std::io::prelude::*;

/// Splits the contents of a file into chunks of at most `chunk_size` bytes.
///
/// Chunks are produced one at a time, either by calling `read_chunk`
/// directly or by using the value as an iterator.
pub struct Chunker {
    /// Maximum number of bytes in a single chunk; `buf` is sized to this.
    chunk_size: usize,
    /// Scratch buffer each chunk is read into before its bytes are copied out.
    buf: Vec<u8>,
    /// Open file the chunks are read from.
    handle: std::fs::File,
}

/// Errors that can occur while splitting a file into chunks.
#[derive(Debug, thiserror::Error)]
pub enum ChunkerError {
    /// An I/O error raised while reading the file. The variant is
    /// `transparent`, so it reports the wrapped error's own message, and
    /// `#[from]` lets `?` convert a `std::io::Error` into it.
    #[error(transparent)]
    IoError(#[from] std::io::Error),
}

/// Result type for chunking operations; the error is always a `ChunkerError`.
pub type ChunkerResult<T> = Result<T, ChunkerError>;

impl Chunker {
    /// Creates a chunker that reads `handle` in chunks of at most
    /// `chunk_size` bytes.
    ///
    /// A zero-filled buffer of `chunk_size` bytes is allocated once here and
    /// reused for every chunk that is read.
    pub fn new(chunk_size: usize, handle: std::fs::File) -> Self {
        Self {
            chunk_size,
            buf: vec![0; chunk_size],
            handle,
        }
    }

    /// Reads the next chunk from the file.
    ///
    /// Keeps reading until the buffer holds `chunk_size` bytes or a read
    /// returns zero bytes, so only the last chunk of a file can be shorter
    /// than `chunk_size`.
    ///
    /// Returns `Ok(None)` when no bytes could be read. Otherwise returns the
    /// chunk's metadata, built from the `sha256` checksum of the bytes read,
    /// together with a `DataChunk` holding a copy of those bytes.
    ///
    /// # Errors
    ///
    /// Returns `ChunkerError::IoError` if reading from the file fails.
    /// Reads that fail with `ErrorKind::Interrupted` are retried rather than
    /// reported, since that error kind is non-fatal.
    pub fn read_chunk(&mut self) -> ChunkerResult<Option<(ChunkMeta, DataChunk)>> {
        let mut used = 0;

        loop {
            match self.handle.read(&mut self.buf[used..]) {
                Ok(n) => {
                    used += n;
                    // A zero-byte read ends the chunk early; a full buffer
                    // completes it.
                    if n == 0 || used == self.chunk_size {
                        break;
                    }
                }
                // An interrupted read transferred no data and is safe to retry.
                Err(e) if e.kind() == std::io::ErrorKind::Interrupted => continue,
                Err(e) => return Err(e.into()),
            }
        }

        if used == 0 {
            return Ok(None);
        }

        // Only the first `used` bytes belong to this chunk; the rest of the
        // buffer may hold stale data from a previous, longer chunk.
        let buffer = &self.buf[..used];
        let hash = sha256(buffer);
        let meta = ChunkMeta::new(&hash);
        let chunk = DataChunk::new(buffer.to_vec());
        Ok(Some((meta, chunk)))
    }
}

impl Iterator for Chunker {
    type Item = ChunkerResult<(ChunkMeta, DataChunk)>;

    /// Yields the next chunk by delegating to `read_chunk`.
    ///
    /// Iteration ends (`None`) when `read_chunk` reports that there is no
    /// more data; a read failure is yielded as `Some(Err(_))`.
    fn next(&mut self) -> Option<Self::Item> {
        // `Result<Option<T>, E>` -> `Option<Result<T, E>>`.
        self.read_chunk().transpose()
    }
}