[pbs-devel] [PATCH pxar] fix `decode_entry` on special files
Dominik Csapak
d.csapak at proxmox.com
Tue Dec 15 12:08:53 CET 2020
Looks good AFAICT.
This fixes the problem with FIFOs/sockets.
Tested-By: Dominik Csapak <d.csapak at proxmox.com>
On 12/15/20 11:37 AM, Wolfgang Bumiller wrote:
> When using the random accessor to access FIFOs or sockets,
> the ranged reader limits the data to only that entry, and
> the `decode_entry` will never see a `PAYLOAD` or
> `GOODBYE_TABLE` item to finish the entry.
> Instead, it'll reach EOF and we need to handle this.
> The accessor now tells the decoder to expect EOF as a valid
> condition for ending the entry.
>
> Signed-off-by: Wolfgang Bumiller <w.bumiller at proxmox.com>
> ---
>
> The included testcase previously failed with
> "failed to decode entry for fifo0"
>
> src/accessor/mod.rs | 2 +-
> src/decoder/mod.rs | 52 +++++++++++++++++++++++++++++++++++---------
> tests/simple/main.rs | 46 +++++++++++++++++++++++++++++++++++++++
> 3 files changed, 89 insertions(+), 11 deletions(-)
>
> diff --git a/src/accessor/mod.rs b/src/accessor/mod.rs
> index 0ab03a6..d02dc13 100644
> --- a/src/accessor/mod.rs
> +++ b/src/accessor/mod.rs
> @@ -229,7 +229,7 @@ async fn get_decoder<T: ReadAt>(
> entry_range: Range<u64>,
> path: PathBuf,
> ) -> io::Result<DecoderImpl<SeqReadAtAdapter<T>>> {
> - Ok(DecoderImpl::new_full(SeqReadAtAdapter::new(input, entry_range), path).await?)
> + Ok(DecoderImpl::new_full(SeqReadAtAdapter::new(input, entry_range), path, true).await?)
> }
>
> // NOTE: This performs the Decoder::read_next_item() behavior! Keep in mind when changing!
> diff --git a/src/decoder/mod.rs b/src/decoder/mod.rs
> index fcc2dd9..2a5e79a 100644
> --- a/src/decoder/mod.rs
> +++ b/src/decoder/mod.rs
> @@ -155,6 +155,10 @@ pub(crate) struct DecoderImpl<T> {
> path_lengths: Vec<usize>,
> state: State,
> with_goodbye_tables: bool,
> +
> + /// The random access code uses decoders for sub-ranges which may not end in a `PAYLOAD` for
> + /// entries like FIFOs or sockets, so there we explicitly allow an item to terminate with EOF.
> + eof_after_entry: bool,
> }
>
> enum State {
> @@ -191,14 +195,18 @@ pub(crate) enum ItemResult {
>
> impl<I: SeqRead> DecoderImpl<I> {
> pub async fn new(input: I) -> io::Result<Self> {
> - Self::new_full(input, "/".into()).await
> + Self::new_full(input, "/".into(), false).await
> }
>
> pub(crate) fn input(&self) -> &I {
> &self.input
> }
>
> - pub(crate) async fn new_full(input: I, path: PathBuf) -> io::Result<Self> {
> + pub(crate) async fn new_full(
> + input: I,
> + path: PathBuf,
> + eof_after_entry: bool,
> + ) -> io::Result<Self> {
> let this = DecoderImpl {
> input,
> current_header: unsafe { mem::zeroed() },
> @@ -210,6 +218,7 @@ impl<I: SeqRead> DecoderImpl<I> {
> path_lengths: Vec::new(),
> state: State::Begin,
> with_goodbye_tables: false,
> + eof_after_entry,
> };
>
> // this.read_next_entry().await?;
> @@ -383,7 +392,14 @@ impl<I: SeqRead> DecoderImpl<I> {
>
> self.current_header = unsafe { mem::zeroed() };
>
> - while self.read_next_item().await? != ItemResult::Entry {}
> + loop {
> + match self.read_next_item_or_eof().await? {
> + Some(ItemResult::Entry) => break,
> + Some(ItemResult::Attribute) => continue,
> + None if self.eof_after_entry => break,
> + None => io_bail!("unexpected EOF in entry"),
> + }
> + }
>
> if self.entry.is_dir() {
> self.path_lengths
> @@ -402,24 +418,40 @@ impl<I: SeqRead> DecoderImpl<I> {
> .ok_or_else(|| io_format_err!("unexpected EOF"))
> }
>
> + async fn read_next_item(&mut self) -> io::Result<ItemResult> {
> + match self.read_next_item_or_eof().await? {
> + Some(item) => Ok(item),
> + None => io_bail!("unexpected EOF"),
> + }
> + }
> +
> + // NOTE: The random accessor will decode FIFOs and Sockets in a decoder instance with a ranged
> + // reader so there is no PAYLOAD or GOODBYE TABLE to "end" an entry.
> + //
> // NOTE: This behavior method is also recreated in the accessor's `get_decoder_at_filename`
> // function! Keep in mind when changing!
> - async fn read_next_item(&mut self) -> io::Result<ItemResult> {
> - self.read_next_header().await?;
> - self.read_current_item().await
> + async fn read_next_item_or_eof(&mut self) -> io::Result<Option<ItemResult>> {
> + match self.read_next_header_or_eof().await? {
> + Some(()) => self.read_current_item().await.map(Some),
> + None => Ok(None),
> + }
> }
>
> - async fn read_next_header(&mut self) -> io::Result<()> {
> + async fn read_next_header_or_eof(&mut self) -> io::Result<Option<()>> {
> let dest = unsafe {
> std::slice::from_raw_parts_mut(
> &mut self.current_header as *mut Header as *mut u8,
> size_of_val(&self.current_header),
> )
> };
> - seq_read_exact(&mut self.input, dest).await?;
> - self.current_header.check_header_size()?;
>
> - Ok(())
> + match seq_read_exact_or_eof(&mut self.input, dest).await? {
> + Some(()) => {
> + self.current_header.check_header_size()?;
> + Ok(Some(()))
> + }
> + None => Ok(None),
> + }
> }
>
> /// Read the next item, the header is already loaded.
> diff --git a/tests/simple/main.rs b/tests/simple/main.rs
> index c73ca10..f15a0f5 100644
> --- a/tests/simple/main.rs
> +++ b/tests/simple/main.rs
> @@ -42,6 +42,9 @@ fn test1() {
>
> assert!(!file.is_empty(), "encoder did not write any data");
>
> + // may be useful for testing...
> + // std::fs::write("myarchive.pxar", &file).expect("failed to write out test archive");
> +
> let mut input = &file[..];
> let mut decoder = decoder::Decoder::from_std(&mut input).expect("failed to create decoder");
> let decoded_fs =
> @@ -53,6 +56,7 @@ fn test1() {
> .expect("failed to create random access reader for encoded archive");
>
> check_bunzip2(&accessor);
> + check_run_special_files(&accessor);
> }
>
> fn check_bunzip2(accessor: &accessor::Accessor<&[u8]>) {
> @@ -85,3 +89,45 @@ fn check_bunzip2(accessor: &accessor::Accessor<&[u8]>) {
>
> assert_eq!(content, "This is the bzip2 executable");
> }
> +
> +fn check_run_special_files(accessor: &accessor::Accessor<&[u8]>) {
> + let rundir = accessor
> + .open_root()
> + .expect("failed to open root of encoded archive")
> + .lookup("run")
> + .expect("failed to open /run in encoded archive")
> + .expect("missing /run in encoded archive")
> + .enter_directory()
> + .expect("expected /run to be a directory in the test archive");
> +
> + assert_eq!(rundir.entry_count(), 2, "expected 2 entries in /run");
> +
> + let mut rd = rundir.read_dir();
> + let fifo0 = rd
> + .next()
> + .expect("expected 'fifo0' entry in rundir")
> + .expect("failed to get first (fifo0) entry in test archive /run directory");
> + assert_eq!(
> + fifo0.file_name(),
> + Path::new("fifo0"),
> + "expected first file in /run to be fifo0"
> + );
> +
> + let _entry = fifo0
> + .decode_entry()
> + .expect("failed to decode entry for fifo0");
> +
> + let sock0 = rd
> + .next()
> + .expect("expected 'sock0' entry in rundir")
> + .expect("failed to get second (sock0) entry in test archive /run directory");
> + assert_eq!(
> + sock0.file_name(),
> + Path::new("sock0"),
> + "expected second file in /run to be sock0"
> + );
> +
> + let _entry = sock0
> + .decode_entry()
> + .expect("failed to decode entry for sock0");
> +}
>
More information about the pbs-devel
mailing list