1
0
Fork 0
mirror of https://codeberg.org/icewind/bitbuffer.git synced 2026-06-03 08:34:07 +02:00

Fix stream position when reading malformed UTF-8

This commit is contained in:
Robin Appelman 2020-12-06 21:20:33 +01:00
commit 4d2ea4ee7c
5 changed files with 38 additions and 10 deletions

View file

@ -1,6 +1,6 @@
[package]
name = "bitbuffer"
version = "0.8.0"
version = "0.8.1"
authors = ["Robin Appelman <robin@icewind.nl>"]
edition = "2018"
description = "Reading bit sequences from a byte slice"

View file

@ -125,7 +125,7 @@ pub enum BitError {
},
/// The slice of bytes that was read is not valid UTF-8
#[error(display = "The read slice of bytes are not valid utf8: {}", _0)]
Utf8Error(#[error(source)] Utf8Error),
Utf8Error(Utf8Error, usize),
/// The string that was requested to be written does not fit in the specified fixed length
#[error(
display = "The string that was requested to be written does not fit in the specified fixed length, string is {} bytes long, while a size of {} has been specified",
@ -142,7 +142,7 @@ pub enum BitError {
// Converts a `FromUtf8Error` (the error type produced by `String::from_utf8`) into a `BitError`.
//
// NOTE(review): this block is rendered from a diff hunk without +/- markers, so the two
// expression lines in the body appear to be the pre-change and post-change versions of the
// same line rather than two consecutive statements -- confirm against the real file.
impl From<FromUtf8Error> for BitError {
fn from(err: FromUtf8Error) -> Self {
// Presumably the removed line: delegates to a `From<Utf8Error>` conversion on `BitError`.
BitError::from(err.utf8_error())
// Presumably the added line: builds the two-field `Utf8Error` variant directly from the
// underlying `Utf8Error` and the length, in bytes, of the buffer that failed to decode.
BitError::Utf8Error(err.utf8_error(), err.as_bytes().len())
}
}

View file

@ -587,9 +587,11 @@ where
.trim_end_matches(char::from(0))
.to_string(),
),
Cow::Borrowed(bytes) => {
Cow::Borrowed(std::str::from_utf8(bytes)?.trim_end_matches(char::from(0)))
}
Cow::Borrowed(bytes) => Cow::Borrowed(
std::str::from_utf8(bytes)
.map_err(|err| BitError::Utf8Error(err, bytes.len()))?
.trim_end_matches(char::from(0)),
),
};
Ok(string)
}
@ -597,7 +599,10 @@ where
let bytes = self.read_string_bytes(position)?;
let string = match bytes {
Cow::Owned(bytes) => Cow::Owned(String::from_utf8(bytes)?),
Cow::Borrowed(bytes) => Cow::Borrowed(std::str::from_utf8(bytes)?),
Cow::Borrowed(bytes) => Cow::Borrowed(
std::str::from_utf8(bytes)
.map_err(|err| BitError::Utf8Error(err, bytes.len()))?,
),
};
Ok(string)
}

View file

@ -306,10 +306,10 @@ where
let result = self.buffer.read_string(self.pos, byte_len).map_err(|err| {
// still advance the stream on malformed utf8
if let BitError::Utf8Error(err) = &err {
if let BitError::Utf8Error(_, len) = &err {
self.pos += match byte_len {
Some(len) => len * 8,
None => min((err.valid_up_to() + 1) * 8, max_length),
None => min((len + 1) * 8, max_length * 8),
};
}
err

View file

@ -3,7 +3,7 @@ use std::num::NonZeroU16;
use maplit::hashmap;
use bitbuffer::{BigEndian, BitRead, BitReadBuffer, BitReadStream, LittleEndian};
use bitbuffer::{BigEndian, BitError, BitRead, BitReadBuffer, BitReadStream, LittleEndian};
const BYTES: &'static [u8] = &[
0b1011_0101,
@ -473,3 +473,26 @@ fn test_to_owned_stream() {
assert_eq!(stream.bit_len(), owned.bit_len());
assert_eq!(stream.bits_left(), owned.bits_left());
}
#[test]
fn test_invalid_utf8() {
    // 129 (0x81) is a UTF-8 continuation byte with no lead byte in front of it, so the text
    // preceding the first NUL cannot be decoded as UTF-8.
    let raw = vec![b'b', b'a', 129, b'c', 0, 0, 0];
    let source = BitReadBuffer::new(&raw, LittleEndian);

    // Read without an explicit length: the error is expected to report 4 bytes and the
    // stream is expected to end up at bit 40 (5 bytes in).
    {
        let mut reader = BitReadStream::new(source.clone());
        let outcome = reader.read_string(None);
        assert!(matches!(outcome, Err(BitError::Utf8Error(_, 4))));
        assert_eq!(reader.pos(), 5 * 8);
    }

    // Read with a fixed length of 6 bytes: the error is expected to report all 6 bytes and
    // the stream is expected to have advanced by exactly those 6 bytes.
    {
        let mut reader = BitReadStream::new(source);
        let outcome = reader.read_string(Some(6));
        assert!(matches!(outcome, Err(BitError::Utf8Error(_, 6))));
        assert_eq!(reader.pos(), 6 * 8);
    }
}