use num_bigint::BigUint;
use std::io::Write;
use std::mem;
use crate::data_source::IonDataSource;
use crate::result::{decoding_error, IonResult};
use crate::types::{Int, UInt};
const UINT_STACK_BUFFER_SIZE: usize = 16;
const MAX_UINT_SIZE_IN_BYTES: usize = 2048;
#[derive(Debug)]
pub struct DecodedUInt {
size_in_bytes: usize,
value: UInt,
}
impl DecodedUInt {
pub(crate) fn new(value: UInt, size_in_bytes: usize) -> Self {
DecodedUInt {
size_in_bytes,
value,
}
}
pub(crate) fn small_uint_from_slice(uint_bytes: &[u8]) -> u64 {
let mut magnitude: u64 = 0;
for &byte in uint_bytes {
let byte = u64::from(byte);
magnitude <<= 8;
magnitude |= byte;
}
magnitude
}
pub(crate) fn big_uint_from_slice(uint_bytes: &[u8]) -> BigUint {
BigUint::from_bytes_be(uint_bytes)
}
pub fn read<R: IonDataSource>(data_source: &mut R, length: usize) -> IonResult<DecodedUInt> {
if length > MAX_UINT_SIZE_IN_BYTES {
return decoding_error(format!(
"Found a {length}-byte UInt. Max supported size is {MAX_UINT_SIZE_IN_BYTES} bytes."
));
}
if length <= UINT_STACK_BUFFER_SIZE {
let buffer = &mut [0u8; UINT_STACK_BUFFER_SIZE];
DecodedUInt::read_using_buffer(data_source, length, buffer)
} else {
let mut buffer = vec![0u8; length];
DecodedUInt::read_using_buffer(data_source, length, buffer.as_mut_slice())
}
}
fn read_using_buffer<R: IonDataSource>(
data_source: &mut R,
length: usize,
buffer: &mut [u8],
) -> IonResult<DecodedUInt> {
let buffer = &mut buffer[0..length];
data_source.read_exact(buffer)?;
let value = if length <= mem::size_of::<u64>() {
let mut magnitude: u64 = 0;
for &byte in buffer.iter() {
let byte = u64::from(byte);
magnitude <<= 8;
magnitude |= byte;
}
UInt::U64(magnitude)
} else {
let magnitude = BigUint::from_bytes_be(buffer);
UInt::BigUInt(magnitude)
};
Ok(DecodedUInt {
size_in_bytes: length,
value,
})
}
pub fn write_u64<W: Write>(sink: &mut W, magnitude: u64) -> IonResult<usize> {
let encoded = encode_u64(magnitude);
let bytes_to_write = encoded.as_ref();
sink.write_all(bytes_to_write)?;
Ok(bytes_to_write.len())
}
#[inline(always)]
pub fn value(&self) -> &UInt {
&self.value
}
#[inline(always)]
pub fn size_in_bytes(&self) -> usize {
self.size_in_bytes
}
}
impl From<DecodedUInt> for Int {
fn from(uint: DecodedUInt) -> Self {
let DecodedUInt {
value,
.. } = uint;
Int::from(value)
}
}
#[derive(Clone, Debug, PartialEq, Eq)]
pub enum UIntBeBytes {
Stack([u8; mem::size_of::<u64>()]),
Heap(Vec<u8>),
}
#[derive(Clone, Debug, PartialEq, Eq)]
pub struct EncodedUInt {
be_bytes: UIntBeBytes,
first_occupied_byte: usize,
}
impl EncodedUInt {
pub fn as_bytes(&self) -> &[u8] {
match self.be_bytes {
UIntBeBytes::Stack(ref byte_array) => &byte_array[self.first_occupied_byte..],
UIntBeBytes::Heap(ref byte_vec) => &byte_vec[self.first_occupied_byte..],
}
}
}
impl AsRef<[u8]> for EncodedUInt {
fn as_ref(&self) -> &[u8] {
self.as_bytes()
}
}
pub fn encode_u64(magnitude: u64) -> EncodedUInt {
let empty_leading_bytes: u32 = magnitude.leading_zeros() / 8;
let first_occupied_byte = empty_leading_bytes as usize;
let magnitude_bytes: [u8; mem::size_of::<u64>()] = magnitude.to_be_bytes();
EncodedUInt {
be_bytes: UIntBeBytes::Stack(magnitude_bytes),
first_occupied_byte,
}
}
pub fn encode_uint(magnitude: &UInt) -> EncodedUInt {
let magnitude: &BigUint = match magnitude {
UInt::U64(m) => return encode_u64(*m),
UInt::BigUInt(m) => m,
};
let be_bytes = UIntBeBytes::Heap(magnitude.to_bytes_be());
let first_occupied_byte = 0;
EncodedUInt {
be_bytes,
first_occupied_byte,
}
}
#[cfg(test)]
mod tests {
use super::*;
use num_traits::Num;
use std::io::Cursor;
const READ_ERROR_MESSAGE: &str = "Failed to read a UInt from the provided cursor.";
const WRITE_ERROR_MESSAGE: &str = "Writing a UInt to the provided sink failed.";
#[test]
fn test_read_one_byte_uint() {
let data = &[0b1000_0000];
let uint = DecodedUInt::read(&mut Cursor::new(data), data.len()).expect(READ_ERROR_MESSAGE);
assert_eq!(uint.size_in_bytes(), 1);
assert_eq!(uint.value(), &UInt::U64(128));
}
#[test]
fn test_read_two_byte_uint() {
let data = &[0b0111_1111, 0b1111_1111];
let uint = DecodedUInt::read(&mut Cursor::new(data), data.len()).expect(READ_ERROR_MESSAGE);
assert_eq!(uint.size_in_bytes(), 2);
assert_eq!(uint.value(), &UInt::U64(32_767));
}
#[test]
fn test_read_three_byte_uint() {
let data = &[0b0011_1100, 0b1000_0111, 0b1000_0001];
let uint = DecodedUInt::read(&mut Cursor::new(data), data.len()).expect(READ_ERROR_MESSAGE);
assert_eq!(uint.size_in_bytes(), 3);
assert_eq!(uint.value(), &UInt::U64(3_966_849));
}
#[test]
fn test_read_ten_byte_uint() {
let data = vec![0xFFu8; 10];
let uint = DecodedUInt::read(&mut Cursor::new(data.as_slice()), data.len())
.expect(READ_ERROR_MESSAGE);
assert_eq!(uint.size_in_bytes(), 10);
assert_eq!(
uint.value(),
&UInt::BigUInt(BigUint::from_str_radix("ffffffffffffffffffff", 16).unwrap())
);
}
#[test]
fn test_read_uint_too_large() {
let mut buffer = Vec::with_capacity(MAX_UINT_SIZE_IN_BYTES + 1);
buffer.resize(MAX_UINT_SIZE_IN_BYTES + 1, 1);
let data = buffer.as_slice();
let _uint = DecodedUInt::read(&mut Cursor::new(data), data.len())
.expect_err("This exceeded the configured max UInt size.");
}
#[test]
fn test_write_ten_byte_uint() {
let value = UInt::BigUInt(BigUint::from_str_radix("ffffffffffffffffffff", 16).unwrap());
let mut buffer: Vec<u8> = vec![];
let encoded = super::encode_uint(&value);
buffer.write_all(encoded.as_bytes()).unwrap();
let expected_bytes = vec![0xFFu8; 10];
assert_eq!(expected_bytes.as_slice(), buffer.as_slice());
}
#[test]
fn test_write_eight_byte_uint() {
let value = 0x01_23_45_67_89_AB_CD_EF;
let mut buffer: Vec<u8> = vec![];
DecodedUInt::write_u64(&mut buffer, value).expect(WRITE_ERROR_MESSAGE);
let expected_bytes = &[0x01, 0x23, 0x45, 0x67, 0x89, 0xAB, 0xCD, 0xEF];
assert_eq!(expected_bytes, buffer.as_slice());
}
#[test]
fn test_write_five_byte_uint() {
let value = 0x01_23_45_67_89;
let mut buffer: Vec<u8> = vec![];
DecodedUInt::write_u64(&mut buffer, value).expect(WRITE_ERROR_MESSAGE);
let expected_bytes = &[0x01, 0x23, 0x45, 0x67, 0x89];
assert_eq!(expected_bytes, buffer.as_slice());
}
#[test]
fn test_write_three_byte_uint() {
let value = 0x01_23_45;
let mut buffer: Vec<u8> = vec![];
DecodedUInt::write_u64(&mut buffer, value).expect(WRITE_ERROR_MESSAGE);
let expected_bytes: &[u8] = &[0x01, 0x23, 0x45];
assert_eq!(expected_bytes, buffer.as_slice());
}
#[test]
fn test_write_uint_zero() {
let value = 0x00;
let mut buffer: Vec<u8> = vec![];
DecodedUInt::write_u64(&mut buffer, value).expect(WRITE_ERROR_MESSAGE);
let expected_bytes: &[u8] = &[];
assert_eq!(expected_bytes, buffer.as_slice());
}
}