diff --git a/src/read.rs b/src/read.rs index c5ea5397..a03763a2 100644 --- a/src/read.rs +++ b/src/read.rs @@ -54,6 +54,7 @@ pub struct ZipArchive reader: R, files: Vec, names_map: HashMap, + offset: u32, } enum ZipFileReader<'a> { @@ -78,11 +79,15 @@ impl ZipArchive { /// Opens a Zip archive and parses the central directory pub fn new(mut reader: R) -> ZipResult> { - let footer = try!(spec::CentralDirectoryEnd::find_and_parse(&mut reader)); + let (footer, cde_start_pos) = try!(spec::CentralDirectoryEnd::find_and_parse(&mut reader)); if footer.disk_number != footer.disk_with_central_directory { return unsupported_zip_error("Support for multi-disk files is not implemented") } - let directory_start = footer.central_directory_offset as u64; + // Some zip files have data prepended to them, resulting in the offsets all being too small. Get the amount of + // error by comparing the actual file position we found the CDE at with the offset recorded in the CDE. + let archive_offset = cde_start_pos - footer.central_directory_size - footer.central_directory_offset; + + let directory_start = (footer.central_directory_offset + archive_offset) as u64; let number_of_files = footer.number_of_files_on_this_disk as usize; let mut files = Vec::with_capacity(number_of_files); @@ -91,12 +96,17 @@ impl ZipArchive try!(reader.seek(io::SeekFrom::Start(directory_start))); for _ in 0 .. number_of_files { - let file = try!(central_header_to_zip_file(&mut reader)); + let file = try!(central_header_to_zip_file(&mut reader, archive_offset)); names_map.insert(file.file_name.clone(), files.len()); files.push(file); } - Ok(ZipArchive { reader: reader, files: files, names_map: names_map }) + Ok(ZipArchive { + reader: reader, + files: files, + names_map: names_map, + offset: archive_offset, + }) } /// Number of files contained in this zip. @@ -116,6 +126,14 @@ impl ZipArchive self.files.len() } + /// Get the offset from the beginning of the underlying reader that this zip begins at, in bytes. + /// + /// Normally this value is zero, but if the zip has arbitrary data prepended to it, then this value will be the size + /// of that prepended data. + pub fn offset(&self) -> u32 { + self.offset + } + /// Search for a file entry by name pub fn by_name<'a>(&'a mut self, name: &str) -> ZipResult> { @@ -178,7 +196,7 @@ impl ZipArchive } } -fn central_header_to_zip_file(reader: &mut R) -> ZipResult +fn central_header_to_zip_file(reader: &mut R, archive_offset: u32) -> ZipResult { // Parse central header let signature = try!(reader.read_u32::()); @@ -204,11 +222,14 @@ fn central_header_to_zip_file(reader: &mut R) -> ZipResult()); let _internal_file_attributes = try!(reader.read_u16::()); let external_file_attributes = try!(reader.read_u32::()); - let offset = try!(reader.read_u32::()) as u64; + let mut offset = try!(reader.read_u32::()) as u64; let file_name_raw = try!(ReadPodExt::read_exact(reader, file_name_length)); let extra_field = try!(ReadPodExt::read_exact(reader, extra_field_length)); let file_comment_raw = try!(ReadPodExt::read_exact(reader, file_comment_length)); + // Account for shifted zip offsets. + offset += archive_offset as u64; + let file_name = match is_utf8 { true => String::from_utf8_lossy(&*file_name_raw).into_owned(), diff --git a/src/spec.rs b/src/spec.rs index bce23f88..ff3cbcde 100644 --- a/src/spec.rs +++ b/src/spec.rs @@ -48,7 +48,7 @@ impl CentralDirectoryEnd }) } - pub fn find_and_parse(reader: &mut T) -> ZipResult + pub fn find_and_parse(reader: &mut T) -> ZipResult<(CentralDirectoryEnd, u32)> { let header_size = 22; let bytes_between_magic_and_comment_size = header_size - 6; @@ -66,8 +66,8 @@ impl CentralDirectoryEnd let comment_length = try!(reader.read_u16::()) as i64; if file_length - pos - header_size == comment_length { - try!(reader.seek(io::SeekFrom::Start(pos as u64))); - return CentralDirectoryEnd::parse(reader); + let cde_start_pos = try!(reader.seek(io::SeekFrom::Start(pos as u64))) as u32; + return CentralDirectoryEnd::parse(reader).map(|cde| (cde, cde_start_pos)); } } pos -= 1;