From 826755f09d31718a14b3884d70988f9430021720 Mon Sep 17 00:00:00 2001 From: xzfc Date: Fri, 30 Aug 2024 22:28:31 +0000 Subject: [PATCH] feat: Add Builder::append_writer --- src/builder.rs | 127 +++++++++++++++++++++++++++++++++++++++++++++++++ src/lib.rs | 2 +- tests/all.rs | 39 +++++++++++++++ 3 files changed, 167 insertions(+), 1 deletion(-) diff --git a/src/builder.rs b/src/builder.rs index 9b799329..359c4966 100644 --- a/src/builder.rs +++ b/src/builder.rs @@ -165,6 +165,47 @@ impl Builder { self.append(&header, data) } + /// Adds a new entry to this archive and returns an [`EntryWriter`] for + /// adding its contents. + /// + /// This function is similar to [`Self::append_data`] but returns a + /// [`io::Write`] implementation instead of taking data as a parameter. + /// + /// Similar constraints around the position of the archive and completion + /// apply as with [`Self::append_data`]. It requires the underlying writer + /// to implement [`Seek`] to update the header after writing the data. + /// + /// # Errors + /// + /// This function will return an error for any intermittent I/O error which + /// occurs when either reading or writing. + /// + /// # Examples + /// + /// ``` + /// use std::io::Cursor; + /// use std::io::Write as _; + /// use tar::{Builder, Header}; + /// + /// let mut header = Header::new_gnu(); + /// + /// let mut ar = Builder::new(Cursor::new(Vec::new())); + /// let mut entry = ar.append_writer(&mut header, "hi.txt").unwrap(); + /// entry.write_all(b"Hello, ").unwrap(); + /// entry.write_all(b"world!\n").unwrap(); + /// entry.finish().unwrap(); + /// ``` + pub fn append_writer<'a, P: AsRef>( + &'a mut self, + header: &'a mut Header, + path: P, + ) -> io::Result> + where + W: Seek, + { + EntryWriter::start(self.get_mut(), header, path.as_ref()) + } + /// Adds a new link (symbolic or hard) entry to this archive with the specified path and target. /// /// This function is similar to [`Self::append_data`] which supports long filenames, @@ -440,6 +481,92 @@ impl Builder { } } +trait SeekWrite: Write + Seek { + fn as_write(&mut self) -> &mut dyn Write; +} + +impl SeekWrite for T { + fn as_write(&mut self) -> &mut dyn Write { + self + } +} + +/// A writer for a single entry in a tar archive. +/// +/// This struct is returned by [`Builder::append_writer`] and provides a +/// [`Write`] implementation for adding content to an archive entry. +/// +/// After writing all data to the entry, it must be finalized either by +/// explicitly calling [`EntryWriter::finish`] or by letting it drop. +pub struct EntryWriter<'a> { + obj: &'a mut dyn SeekWrite, + header: &'a mut Header, + written: u64, +} + +impl EntryWriter<'_> { + fn start<'a>( + obj: &'a mut dyn SeekWrite, + header: &'a mut Header, + path: &Path, + ) -> io::Result> { + prepare_header_path(obj.as_write(), header, path)?; + + // Write header stub. It will rewritten after all data will be written. + obj.write_all([0; 512].as_ref())?; + + Ok(EntryWriter { + obj, + header, + written: 0, + }) + } + + /// Finish writing the current entry in the archive. + pub fn finish(self) -> io::Result<()> { + let mut this = std::mem::ManuallyDrop::new(self); + this.do_finish() + } + + fn do_finish(&mut self) -> io::Result<()> { + // Pad with zeros if necessary. + let buf = [0; 512]; + let remaining = u64::wrapping_sub(512, self.written) % 512; + self.obj.write_all(&buf[..remaining as usize])?; + let written = (self.written + remaining) as i64; + + // Seek back to the header position. + self.obj.seek(io::SeekFrom::Current(-written - 512))?; + + self.header.set_size(self.written); + self.header.set_cksum(); + self.obj.write_all(self.header.as_bytes())?; + + // Seek forward to restore the position. + self.obj.seek(io::SeekFrom::Current(written))?; + + Ok(()) + } +} + +impl Write for EntryWriter<'_> { + fn write(&mut self, buf: &[u8]) -> io::Result { + let len = self.obj.write(buf)?; + self.written += len as u64; + Ok(len) + } + + fn flush(&mut self) -> io::Result<()> { + self.obj.flush() + } +} + +impl Drop for EntryWriter<'_> { + fn drop(&mut self) { + let _ = self.do_finish(); + } +} + fn append(mut dst: &mut dyn Write, header: &Header, mut data: &mut dyn Read) -> io::Result<()> { dst.write_all(header.as_bytes())?; let len = io::copy(&mut data, &mut dst)?; diff --git a/src/lib.rs b/src/lib.rs index 52251cd2..78d89a05 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -24,7 +24,7 @@ use std::io::{Error, ErrorKind}; pub use crate::archive::{Archive, Entries}; -pub use crate::builder::Builder; +pub use crate::builder::{Builder, EntryWriter}; pub use crate::entry::{Entry, Unpacked}; pub use crate::entry_type::EntryType; pub use crate::header::GnuExtSparseHeader; diff --git a/tests/all.rs b/tests/all.rs index 27a6fcf1..5ac28ce5 100644 --- a/tests/all.rs +++ b/tests/all.rs @@ -1043,6 +1043,45 @@ fn linkname_literal() { } } +#[test] +fn append_writer() { + let mut b = Builder::new(Cursor::new(Vec::new())); + + let mut h = Header::new_gnu(); + h.set_uid(42); + let mut writer = t!(b.append_writer(&mut h, "file1")); + t!(writer.write_all(b"foo")); + t!(writer.write_all(b"barbaz")); + t!(writer.finish()); + + let mut h = Header::new_gnu(); + h.set_uid(43); + let long_path: PathBuf = repeat("abcd").take(50).collect(); + let mut writer = t!(b.append_writer(&mut h, &long_path)); + let long_data = repeat(b'x').take(513).collect::>(); + t!(writer.write_all(&long_data)); + t!(writer.finish()); + + let contents = t!(b.into_inner()).into_inner(); + let mut ar = Archive::new(&contents[..]); + let mut entries = t!(ar.entries()); + + let e = &mut t!(entries.next().unwrap()); + assert_eq!(e.header().uid().unwrap(), 42); + assert_eq!(&*e.path_bytes(), b"file1"); + let mut r = Vec::new(); + t!(e.read_to_end(&mut r)); + assert_eq!(&r[..], b"foobarbaz"); + + let e = &mut t!(entries.next().unwrap()); + assert_eq!(e.header().uid().unwrap(), 43); + assert_eq!(t!(e.path()), long_path.as_path()); + let mut r = Vec::new(); + t!(e.read_to_end(&mut r)); + assert_eq!(r.len(), 513); + assert!(r.iter().all(|b| *b == b'x')); +} + #[test] fn encoded_long_name_has_trailing_nul() { let td = t!(TempBuilder::new().prefix("tar-rs").tempdir());