ripgrep-all/src/caching_writer.rs

70 lines
2.1 KiB
Rust
Raw Normal View History

2019-06-05 19:28:35 +00:00
use failure::Fallible;
2019-06-07 21:17:33 +00:00
use log::*;
2019-06-06 21:43:30 +00:00
use std::io::Write;
2019-06-05 14:43:40 +00:00
/**
* wrap a writer so that it is passthrough,
2019-06-07 17:00:24 +00:00
* but also the written data is compressed and written into a buffer,
* unless more than max_cache_size bytes is written, then the cache is dropped and it is pure passthrough.
2019-06-05 14:43:40 +00:00
*/
pub struct CachingWriter<W: Write> {
max_cache_size: usize,
zstd_writer: Option<zstd::stream::write::Encoder<Vec<u8>>>,
out: W,
}
impl<W: Write> CachingWriter<W> {
pub fn new(
out: W,
max_cache_size: usize,
compression_level: i32,
2019-06-05 19:28:35 +00:00
) -> Fallible<CachingWriter<W>> {
2019-06-05 14:43:40 +00:00
Ok(CachingWriter {
out,
max_cache_size,
zstd_writer: Some(zstd::stream::write::Encoder::new(
Vec::new(),
compression_level,
)?),
})
}
pub fn finish(self) -> std::io::Result<Option<Vec<u8>>> {
if let Some(writer) = self.zstd_writer {
let res = writer.finish()?;
if res.len() <= self.max_cache_size {
Ok(Some(res))
} else {
// drop cache
Ok(None)
}
} else {
Ok(None)
}
}
}
impl<W: Write> Write for CachingWriter<W> {
fn write(&mut self, buf: &[u8]) -> std::io::Result<usize> {
match self.zstd_writer.as_mut() {
Some(writer) => {
let wrote = writer.write(buf)?;
let compressed_len = writer.get_ref().len();
2019-06-11 11:34:04 +00:00
trace!("wrote {} to zstd, len now {}", wrote, compressed_len);
2019-06-05 14:43:40 +00:00
if compressed_len > self.max_cache_size {
eprintln!("cache longer than max, dropping");
//writer.finish();
self.zstd_writer.take().unwrap().finish()?;
}
self.out.write_all(&buf[0..wrote])?;
2019-06-06 21:43:30 +00:00
Ok(wrote)
2019-06-05 14:43:40 +00:00
}
None => self.out.write(buf),
}
}
fn flush(&mut self) -> std::io::Result<()> {
eprintln!("flushing");
if let Some(writer) = self.zstd_writer.as_mut() {
writer.flush()?;
}
self.out.flush()
}
}