- let magic: [u8; 4] = read_bytes(&mut r)?;
- let (is_zsav, is_ebcdic) = match &magic {
- ASCII_MAGIC => (false, false),
- ASCII_ZMAGIC => (true, false),
- EBCDIC_MAGIC => (false, true),
- _ => return Err(Error::NotASystemFile),
- };
-
- let eye_catcher: [u8; 60] = read_bytes(&mut r)?;
- let layout_code: [u8; 4] = read_bytes(&mut r)?;
- let endianness = Endian::identify_u32(2, layout_code)
- .or_else(|| Endian::identify_u32(2, layout_code))
- .ok_or_else(|| Error::NotASystemFile)?;
-
- let nominal_case_size: u32 = endianness.parse(read_bytes(&mut r)?);
- let nominal_case_size = (nominal_case_size <= u32::MAX / 32).then_some(nominal_case_size);
-
- let compression_code: u32 = endianness.parse(read_bytes(&mut r)?);
- let compression = match (is_zsav, compression_code) {
- (false, 0) => None,
- (false, 1) => Some(Compression::Simple),
- (true, 2) => Some(Compression::ZLib),
- (false, code) => return Err(Error::InvalidSavCompression(code)),
- (true, code) => return Err(Error::InvalidZsavCompression(code)),
- };
-
- let weight_index: u32 = endianness.parse(read_bytes(&mut r)?);
- let weight_index = (weight_index > 0).then_some(weight_index - 1);
-
- let n_cases: u32 = endianness.parse(read_bytes(&mut r)?);
- let n_cases = (n_cases <= u32::MAX / 4).then_some(n_cases);
-
- let bias: f64 = endianness.parse(read_bytes(&mut r)?);
- if bias != 100.0 {
- warn(Warning::UnexpectedBias(bias))
+ let header = read_header(&mut r, &warn)?;
+ let e = header.endianness;
+ let mut document_record = None;
+ let mut variables = Vec::new();
+ loop {
+ let rec_type: u32 = e.parse(read_bytes(&mut r)?);
+ match rec_type {
+ 2 => variables.push(read_variable_record(&mut r, e)?),
+ /*
+ 3 => d.read_value_label_record()?,
+ */
+ // A Type 4 record is always immediately after a type 3 record,
+ // the code for type 3 records reads the type 4 record too.
+ 4 => return Err(Error::MisplacedType4Record),
+
+ 6 => {
+ let d = read_document_record(&mut r, e)?;
+ if document_record.is_some() {
+ warn(Warning::DuplicateDocumentRecord);
+ } else {
+ document_record = d;
+ }
+ }
+ /*
+ 7 => d.read_extension_record()?,
+ */
+ 999 => break,
+ _ => return Err(Error::BadRecordType(rec_type)),
+ }
+ }
+
+ Ok(Reader { r, document_record })
+ }
+}
+
+/// Reads and validates the fixed-layout file header from `r`.
+///
+/// Fields are consumed in this order: magic, eye catcher, layout code, nominal
+/// case size, compression code, weight index, case count, bias, creation date,
+/// creation time, file label, and three trailing bytes that are discarded.
+///
+/// `warn` is called for conditions that are suspicious but not fatal; in this
+/// function that is only a bias other than `100.0`.
+///
+/// # Errors
+///
+/// * [`Error::NotASystemFile`] if the magic is not one of the known values or
+///   the layout code does not decode to 2 or 3 in either byte order.
+/// * [`Error::InvalidSavCompression`] / [`Error::InvalidZsavCompression`] if the
+///   compression code is not valid for the kind of file named by the magic.
+/// * Any error propagated from `read_bytes`.
+fn read_header<R: Read>(r: &mut R, warn: impl Fn(Warning)) -> Result<FileHeader, Error> {
+    let magic: [u8; 4] = read_bytes(r)?;
+    let (is_zsav, is_ebcdic) = match &magic {
+        ASCII_MAGIC => (false, false),
+        ASCII_ZMAGIC => (true, false),
+        EBCDIC_MAGIC => (false, true),
+        _ => return Err(Error::NotASystemFile),
+    };
+
+    let eye_catcher: [u8; 60] = read_bytes(r)?;
+    let layout_code: [u8; 4] = read_bytes(r)?;
+    // The layout code is normally 2, but 3 also occurs in real files.  The byte
+    // order under which it decodes to one of those values is the byte order
+    // used for the rest of the file.
+    let endianness = Endian::identify_u32(2, layout_code)
+        .or_else(|| Endian::identify_u32(3, layout_code))
+        .ok_or(Error::NotASystemFile)?;
+
+    // Implausibly large case sizes are mapped to `None`.
+    let nominal_case_size: u32 = endianness.parse(read_bytes(r)?);
+    let nominal_case_size =
+        (nominal_case_size <= i32::MAX as u32 / 16).then_some(nominal_case_size);
+
+    // NOTE(review): `compression` is validated here but is not stored in the
+    // returned `FileHeader`.
+    let compression_code: u32 = endianness.parse(read_bytes(r)?);
+    let compression = match (is_zsav, compression_code) {
+        (false, 0) => None,
+        (false, 1) => Some(Compression::Simple),
+        (true, 2) => Some(Compression::ZLib),
+        (false, code) => return Err(Error::InvalidSavCompression(code)),
+        (true, code) => return Err(Error::InvalidZsavCompression(code)),
+    };
+
+    // The on-disk index is 1-based with 0 meaning "none".  `checked_sub` turns
+    // it into a 0-based `Option` without ever computing `0 - 1`, which would
+    // overflow `u32` (and panic when overflow checks are enabled).
+    let weight_index: u32 = endianness.parse(read_bytes(r)?);
+    let weight_index = weight_index.checked_sub(1);
+
+    // Implausibly large case counts are mapped to `None`.
+    // NOTE(review): `n_cases` is not stored in the returned `FileHeader` either.
+    let n_cases: u32 = endianness.parse(read_bytes(r)?);
+    let n_cases = (n_cases < i32::MAX as u32 / 2).then_some(n_cases);
+
+    let bias: f64 = endianness.parse(read_bytes(r)?);
+    if bias != 100.0 {
+        warn(Warning::UnexpectedBias(bias));
+    }
+
+    let creation_date: [u8; 9] = read_bytes(r)?;
+    let creation_time: [u8; 8] = read_bytes(r)?;
+    let file_label: [u8; 64] = read_bytes(r)?;
+    // Three more bytes are read and thrown away.
+    let _: [u8; 3] = read_bytes(r)?;
+
+    Ok(FileHeader {
+        magic,
+        is_zsav,
+        is_ebcdic,
+        endianness,
+        weight_index,
+        nominal_case_size,
+        creation_date,
+        creation_time,
+        eye_catcher,
+        file_label,
+    })
+}
+
+/// The raw, undecoded contents of one variable record.
+///
+/// Byte-array fields are kept exactly as read; no character-set decoding is
+/// applied to them here.
+pub struct VariableRecord {
+    /// Where the record begins, as a byte offset from the start of the file.
+    pub pos: u64,
+
+    /// Width of the variable; valid values lie in -1..=255.
+    pub width: i32,
+
+    /// Name of the variable, right-padded with spaces to 8 bytes.
+    pub name: [u8; 8],
+
+    /// Format used for printing.
+    pub print_format: u32,
+
+    /// Format used for writing.
+    pub write_format: u32,
+
+    /// Code describing the missing values: one of -3, -2, 0, 1, 2, or 3.
+    pub missing_value_code: i32,
+
+    /// The missing values themselves, in raw form; at most 3 entries.
+    pub missing: Vec<[u8; 8]>,
+
+    /// The variable's label, if it has one.
+    pub label: Option<Vec<u8>>,
+}
+
+fn read_variable_record<R: Read + Seek>(
+ r: &mut BufReader<R>,
+ e: Endian,
+) -> Result<VariableRecord, Error> {
+ let pos = r.stream_position()?;
+ let width: i32 = e.parse(read_bytes(r)?);
+ let has_variable_label: u32 = e.parse(read_bytes(r)?);
+ let missing_value_code: i32 = e.parse(read_bytes(r)?);
+ let print_format: u32 = e.parse(read_bytes(r)?);
+ let write_format: u32 = e.parse(read_bytes(r)?);
+ let name: [u8; 8] = read_bytes(r)?;
+
+ let label = match has_variable_label {
+ 0 => None,
+ 1 => {
+ let len: u32 = e.parse(read_bytes(r)?);
+ let read_len = len.min(65535) as usize;
+ let label = Some(read_vec(r, read_len)?);
+
+ let padding_bytes = Integer::next_multiple_of(&len, &4) - len;
+ let _ = read_vec(r, padding_bytes as usize)?;
+
+ label
+ }
+ _ => return Err(Error::BadVariableLabelIndicator(has_variable_label)),
+ };
+
+ let mut missing = Vec::new();
+ if missing_value_code != 0 {
+ match (width, missing_value_code) {
+ (0, -3 | -2 | 1 | 2 | 3) => (),
+ (0, _) => return Err(Error::BadNumericMissingValueIndicator(missing_value_code)),
+ (_, 0..=3) => (),
+ (_, _) => return Err(Error::BadStringMissingValueIndicator(missing_value_code)),