use std::{cmp, mem::size_of};
use bytes::Bytes;
use crate::errors::{ParquetError, Result};
use crate::util::bit_util::{self, BitReader, BitWriter, FromBytes};
const MAX_GROUPS_PER_BIT_PACKED_RUN: usize = 1 << 6;
pub struct RleEncoder {
bit_width: u8,
bit_writer: BitWriter,
buffered_values: [u64; 8],
num_buffered_values: usize,
current_value: u64,
repeat_count: usize,
bit_packed_count: usize,
indicator_byte_pos: i64,
}
impl RleEncoder {
#[allow(unused)]
pub fn new(bit_width: u8, buffer_len: usize) -> Self {
let buffer = Vec::with_capacity(buffer_len);
RleEncoder::new_from_buf(bit_width, buffer)
}
pub fn new_from_buf(bit_width: u8, buffer: Vec<u8>) -> Self {
let bit_writer = BitWriter::new_from_buf(buffer);
RleEncoder {
bit_width,
bit_writer,
buffered_values: [0; 8],
num_buffered_values: 0,
current_value: 0,
repeat_count: 0,
bit_packed_count: 0,
indicator_byte_pos: -1,
}
}
pub fn max_buffer_size(bit_width: u8, num_values: usize) -> usize {
let num_runs = bit_util::ceil(num_values, 8);
let bytes_per_run = bit_width as usize;
let bit_packed_max_size = num_runs + num_runs * bytes_per_run;
let rle_len_prefix = 1;
let min_rle_run_size = rle_len_prefix + bit_util::ceil(bit_width as usize, 8);
let rle_max_size = num_runs * min_rle_run_size;
bit_packed_max_size.max(rle_max_size)
}
#[inline]
pub fn put(&mut self, value: u64) {
if self.current_value == value {
self.repeat_count += 1;
if self.repeat_count > 8 {
return;
}
} else {
if self.repeat_count >= 8 {
assert_eq!(self.bit_packed_count, 0);
self.flush_rle_run();
}
self.repeat_count = 1;
self.current_value = value;
}
self.buffered_values[self.num_buffered_values] = value;
self.num_buffered_values += 1;
if self.num_buffered_values == 8 {
assert_eq!(self.bit_packed_count % 8, 0);
self.flush_buffered_values();
}
}
#[inline]
#[allow(unused)]
pub fn buffer(&self) -> &[u8] {
self.bit_writer.buffer()
}
#[inline]
pub fn len(&self) -> usize {
self.bit_writer.bytes_written()
}
#[allow(unused)]
pub fn is_empty(&self) -> bool {
self.bit_writer.bytes_written() == 0
}
#[inline]
pub fn consume(mut self) -> Vec<u8> {
self.flush();
self.bit_writer.consume()
}
#[inline]
#[allow(unused)]
pub fn flush_buffer(&mut self) -> &[u8] {
self.flush();
self.bit_writer.flush_buffer()
}
#[inline]
#[allow(unused)]
pub fn clear(&mut self) {
self.bit_writer.clear();
self.num_buffered_values = 0;
self.current_value = 0;
self.repeat_count = 0;
self.bit_packed_count = 0;
self.indicator_byte_pos = -1;
}
#[inline]
pub fn flush(&mut self) {
if self.bit_packed_count > 0 || self.repeat_count > 0 || self.num_buffered_values > 0 {
let all_repeat = self.bit_packed_count == 0
&& (self.repeat_count == self.num_buffered_values || self.num_buffered_values == 0);
if self.repeat_count > 0 && all_repeat {
self.flush_rle_run();
} else {
if self.num_buffered_values > 0 {
while self.num_buffered_values < 8 {
self.buffered_values[self.num_buffered_values] = 0;
self.num_buffered_values += 1;
}
}
self.bit_packed_count += self.num_buffered_values;
self.flush_bit_packed_run(true);
self.repeat_count = 0;
}
}
}
fn flush_rle_run(&mut self) {
assert!(self.repeat_count > 0);
let indicator_value = self.repeat_count << 1;
self.bit_writer.put_vlq_int(indicator_value as u64);
self.bit_writer.put_aligned(
self.current_value,
bit_util::ceil(self.bit_width as usize, 8),
);
self.num_buffered_values = 0;
self.repeat_count = 0;
}
fn flush_bit_packed_run(&mut self, update_indicator_byte: bool) {
if self.indicator_byte_pos < 0 {
self.indicator_byte_pos = self.bit_writer.skip(1) as i64;
}
for i in 0..self.num_buffered_values {
self.bit_writer
.put_value(self.buffered_values[i], self.bit_width as usize);
}
self.num_buffered_values = 0;
if update_indicator_byte {
let num_groups = self.bit_packed_count / 8;
let indicator_byte = ((num_groups << 1) | 1) as u8;
self.bit_writer
.put_aligned_offset(indicator_byte, 1, self.indicator_byte_pos as usize);
self.indicator_byte_pos = -1;
self.bit_packed_count = 0;
}
}
#[inline(never)]
fn flush_buffered_values(&mut self) {
if self.repeat_count >= 8 {
self.num_buffered_values = 0;
if self.bit_packed_count > 0 {
assert_eq!(self.bit_packed_count % 8, 0);
self.flush_bit_packed_run(true)
}
return;
}
self.bit_packed_count += self.num_buffered_values;
let num_groups = self.bit_packed_count / 8;
if num_groups + 1 >= MAX_GROUPS_PER_BIT_PACKED_RUN {
assert!(self.indicator_byte_pos >= 0);
self.flush_bit_packed_run(true);
} else {
self.flush_bit_packed_run(false);
}
self.repeat_count = 0;
}
pub(crate) fn estimated_memory_size(&self) -> usize {
self.bit_writer.estimated_memory_size() + std::mem::size_of::<Self>()
}
}
const RLE_DECODER_INDEX_BUFFER_SIZE: usize = 1024;
pub struct RleDecoder {
bit_width: u8,
bit_reader: Option<BitReader>,
index_buf: Option<Box<[i32; RLE_DECODER_INDEX_BUFFER_SIZE]>>,
rle_left: u32,
bit_packed_left: u32,
current_value: Option<u64>,
}
impl RleDecoder {
pub fn new(bit_width: u8) -> Self {
RleDecoder {
bit_width,
rle_left: 0,
bit_packed_left: 0,
bit_reader: None,
index_buf: None,
current_value: None,
}
}
#[inline]
pub fn set_data(&mut self, data: Bytes) {
if let Some(ref mut bit_reader) = self.bit_reader {
bit_reader.reset(data);
} else {
self.bit_reader = Some(BitReader::new(data));
}
let _ = self.reload();
}
#[inline(never)]
#[allow(unused)]
pub fn get<T: FromBytes>(&mut self) -> Result<Option<T>> {
assert!(size_of::<T>() <= 8);
while self.rle_left == 0 && self.bit_packed_left == 0 {
if !self.reload() {
return Ok(None);
}
}
let value = if self.rle_left > 0 {
let rle_value = T::try_from_le_slice(
&self
.current_value
.as_mut()
.expect("current_value should be Some")
.to_ne_bytes(),
)?;
self.rle_left -= 1;
rle_value
} else {
let bit_reader = self.bit_reader.as_mut().expect("bit_reader should be Some");
let bit_packed_value = bit_reader
.get_value(self.bit_width as usize)
.ok_or_else(|| eof_err!("Not enough data for 'bit_packed_value'"))?;
self.bit_packed_left -= 1;
bit_packed_value
};
Ok(Some(value))
}
#[inline(never)]
pub fn get_batch<T: FromBytes>(&mut self, buffer: &mut [T]) -> Result<usize> {
assert!(size_of::<T>() <= 8);
let mut values_read = 0;
while values_read < buffer.len() {
if self.rle_left > 0 {
let num_values = cmp::min(buffer.len() - values_read, self.rle_left as usize);
for i in 0..num_values {
let repeated_value =
T::try_from_le_slice(&self.current_value.as_mut().unwrap().to_ne_bytes())?;
buffer[values_read + i] = repeated_value;
}
self.rle_left -= num_values as u32;
values_read += num_values;
} else if self.bit_packed_left > 0 {
let mut num_values =
cmp::min(buffer.len() - values_read, self.bit_packed_left as usize);
let bit_reader = self.bit_reader.as_mut().expect("bit_reader should be set");
num_values = bit_reader.get_batch::<T>(
&mut buffer[values_read..values_read + num_values],
self.bit_width as usize,
);
if num_values == 0 {
self.bit_packed_left = 0;
continue;
}
self.bit_packed_left -= num_values as u32;
values_read += num_values;
} else if !self.reload() {
break;
}
}
Ok(values_read)
}
#[inline(never)]
pub fn skip(&mut self, num_values: usize) -> Result<usize> {
let mut values_skipped = 0;
while values_skipped < num_values {
if self.rle_left > 0 {
let num_values = cmp::min(num_values - values_skipped, self.rle_left as usize);
self.rle_left -= num_values as u32;
values_skipped += num_values;
} else if self.bit_packed_left > 0 {
let mut num_values =
cmp::min(num_values - values_skipped, self.bit_packed_left as usize);
let bit_reader = self.bit_reader.as_mut().expect("bit_reader should be set");
num_values = bit_reader.skip(num_values, self.bit_width as usize);
if num_values == 0 {
self.bit_packed_left = 0;
continue;
}
self.bit_packed_left -= num_values as u32;
values_skipped += num_values;
} else if !self.reload() {
break;
}
}
Ok(values_skipped)
}
#[inline(never)]
pub fn get_batch_with_dict<T>(
&mut self,
dict: &[T],
buffer: &mut [T],
max_values: usize,
) -> Result<usize>
where
T: Default + Clone,
{
assert!(buffer.len() >= max_values);
let mut values_read = 0;
while values_read < max_values {
let index_buf = self.index_buf.get_or_insert_with(|| Box::new([0; 1024]));
if self.rle_left > 0 {
let num_values = cmp::min(max_values - values_read, self.rle_left as usize);
let dict_idx = self.current_value.unwrap() as usize;
for i in 0..num_values {
buffer[values_read + i].clone_from(&dict[dict_idx]);
}
self.rle_left -= num_values as u32;
values_read += num_values;
} else if self.bit_packed_left > 0 {
let bit_reader = self.bit_reader.as_mut().expect("bit_reader should be set");
loop {
let to_read = index_buf
.len()
.min(max_values - values_read)
.min(self.bit_packed_left as usize);
if to_read == 0 {
break;
}
let num_values = bit_reader
.get_batch::<i32>(&mut index_buf[..to_read], self.bit_width as usize);
if num_values == 0 {
self.bit_packed_left = 0;
break;
}
for i in 0..num_values {
buffer[values_read + i].clone_from(&dict[index_buf[i] as usize])
}
self.bit_packed_left -= num_values as u32;
values_read += num_values;
if num_values < to_read {
break;
}
}
} else if !self.reload() {
break;
}
}
Ok(values_read)
}
#[inline]
fn reload(&mut self) -> bool {
let bit_reader = self.bit_reader.as_mut().expect("bit_reader should be set");
if let Some(indicator_value) = bit_reader.get_vlq_int() {
if indicator_value == 0 {
return false;
}
if indicator_value & 1 == 1 {
self.bit_packed_left = ((indicator_value >> 1) * 8) as u32;
} else {
self.rle_left = (indicator_value >> 1) as u32;
let value_width = bit_util::ceil(self.bit_width as usize, 8);
self.current_value = bit_reader.get_aligned::<u64>(value_width);
assert!(self.current_value.is_some());
}
true
} else {
false
}
}
}
#[cfg(test)]
mod tests {
use super::*;
use crate::util::bit_util::ceil;
use rand::{self, distributions::Standard, thread_rng, Rng, SeedableRng};
const MAX_WIDTH: usize = 32;
#[test]
fn test_rle_decode_int32() {
let data = vec![0x03, 0x88, 0xC6, 0xFA];
let mut decoder: RleDecoder = RleDecoder::new(3);
decoder.set_data(data.into());
let mut buffer = vec![0; 8];
let expected = vec![0, 1, 2, 3, 4, 5, 6, 7];
let result = decoder.get_batch::<i32>(&mut buffer);
assert!(result.is_ok());
assert_eq!(buffer, expected);
}
#[test]
fn test_rle_skip_int32() {
let data = vec![0x03, 0x88, 0xC6, 0xFA];
let mut decoder: RleDecoder = RleDecoder::new(3);
decoder.set_data(data.into());
let expected = vec![2, 3, 4, 5, 6, 7];
let skipped = decoder.skip(2).expect("skipping values");
assert_eq!(skipped, 2);
let mut buffer = vec![0; 6];
let remaining = decoder
.get_batch::<i32>(&mut buffer)
.expect("getting remaining");
assert_eq!(remaining, 6);
assert_eq!(buffer, expected);
}
#[test]
fn test_rle_consume_flush_buffer() {
let data = vec![1, 1, 1, 2, 2, 3, 3, 3];
let mut encoder1 = RleEncoder::new(3, 256);
let mut encoder2 = RleEncoder::new(3, 256);
for value in data {
encoder1.put(value as u64);
encoder2.put(value as u64);
}
let res1 = encoder1.flush_buffer();
let res2 = encoder2.consume();
assert_eq!(res1, &res2[..]);
}
#[test]
fn test_rle_decode_bool() {
let data1 = vec![0x64, 0x01, 0x64, 0x00];
let data2 = vec![
0x1B, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0x0A,
];
let mut decoder: RleDecoder = RleDecoder::new(1);
decoder.set_data(data1.into());
let mut buffer = vec![false; 100];
let mut expected = vec![];
for i in 0..100 {
if i < 50 {
expected.push(true);
} else {
expected.push(false);
}
}
let result = decoder.get_batch::<bool>(&mut buffer);
assert!(result.is_ok());
assert_eq!(buffer, expected);
decoder.set_data(data2.into());
let mut buffer = vec![false; 100];
let mut expected = vec![];
for i in 0..100 {
if i % 2 == 0 {
expected.push(false);
} else {
expected.push(true);
}
}
let result = decoder.get_batch::<bool>(&mut buffer);
assert!(result.is_ok());
assert_eq!(buffer, expected);
}
#[test]
fn test_rle_skip_bool() {
let data1 = vec![0x64, 0x01, 0x64, 0x00];
let data2 = vec![
0x1B, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0xAA, 0x0A,
];
let mut decoder: RleDecoder = RleDecoder::new(1);
decoder.set_data(data1.into());
let mut buffer = vec![true; 50];
let expected = vec![false; 50];
let skipped = decoder.skip(50).expect("skipping first 50");
assert_eq!(skipped, 50);
let remainder = decoder
.get_batch::<bool>(&mut buffer)
.expect("getting remaining 50");
assert_eq!(remainder, 50);
assert_eq!(buffer, expected);
decoder.set_data(data2.into());
let mut buffer = vec![false; 50];
let mut expected = vec![];
for i in 0..50 {
if i % 2 == 0 {
expected.push(false);
} else {
expected.push(true);
}
}
let skipped = decoder.skip(50).expect("skipping first 50");
assert_eq!(skipped, 50);
let remainder = decoder
.get_batch::<bool>(&mut buffer)
.expect("getting remaining 50");
assert_eq!(remainder, 50);
assert_eq!(buffer, expected);
}
#[test]
fn test_rle_decode_with_dict_int32() {
let dict = vec![10, 20, 30];
let data = vec![0x06, 0x00, 0x08, 0x01, 0x0A, 0x02];
let mut decoder: RleDecoder = RleDecoder::new(3);
decoder.set_data(data.into());
let mut buffer = vec![0; 12];
let expected = vec![10, 10, 10, 20, 20, 20, 20, 30, 30, 30, 30, 30];
let result = decoder.get_batch_with_dict::<i32>(&dict, &mut buffer, 12);
assert!(result.is_ok());
assert_eq!(buffer, expected);
let dict = vec!["aaa", "bbb", "ccc", "ddd", "eee", "fff"];
let data = vec![0x03, 0x63, 0xC7, 0x8E, 0x03, 0x65, 0x0B];
let mut decoder: RleDecoder = RleDecoder::new(3);
decoder.set_data(data.into());
let mut buffer = vec![""; 12];
let expected = vec![
"ddd", "eee", "fff", "ddd", "eee", "fff", "ddd", "eee", "fff", "eee", "fff", "fff",
];
let result =
decoder.get_batch_with_dict::<&str>(dict.as_slice(), buffer.as_mut_slice(), 12);
assert!(result.is_ok());
assert_eq!(buffer, expected);
}
#[test]
fn test_rle_skip_dict() {
let dict = vec![10, 20, 30];
let data = vec![0x06, 0x00, 0x08, 0x01, 0x0A, 0x02];
let mut decoder: RleDecoder = RleDecoder::new(3);
decoder.set_data(data.into());
let mut buffer = vec![0; 10];
let expected = vec![10, 20, 20, 20, 20, 30, 30, 30, 30, 30];
let skipped = decoder.skip(2).expect("skipping two values");
assert_eq!(skipped, 2);
let remainder = decoder
.get_batch_with_dict::<i32>(&dict, &mut buffer, 10)
.expect("getting remainder");
assert_eq!(remainder, 10);
assert_eq!(buffer, expected);
let dict = vec!["aaa", "bbb", "ccc", "ddd", "eee", "fff"];
let data = vec![0x03, 0x63, 0xC7, 0x8E, 0x03, 0x65, 0x0B];
let mut decoder: RleDecoder = RleDecoder::new(3);
decoder.set_data(data.into());
let mut buffer = vec![""; 8];
let expected = vec!["eee", "fff", "ddd", "eee", "fff", "eee", "fff", "fff"];
let skipped = decoder.skip(4).expect("skipping four values");
assert_eq!(skipped, 4);
let remainder = decoder
.get_batch_with_dict::<&str>(dict.as_slice(), buffer.as_mut_slice(), 8)
.expect("getting remainder");
assert_eq!(remainder, 8);
assert_eq!(buffer, expected);
}
fn validate_rle(
values: &[i64],
bit_width: u8,
expected_encoding: Option<&[u8]>,
expected_len: i32,
) {
let buffer_len = 64 * 1024;
let mut encoder = RleEncoder::new(bit_width, buffer_len);
for v in values {
encoder.put(*v as u64)
}
let buffer: Bytes = encoder.consume().into();
if expected_len != -1 {
assert_eq!(buffer.len(), expected_len as usize);
}
if let Some(b) = expected_encoding {
assert_eq!(buffer.as_ref(), b);
}
let mut decoder = RleDecoder::new(bit_width);
decoder.set_data(buffer.clone());
for v in values {
let val: i64 = decoder
.get()
.expect("get() should be OK")
.expect("get() should return more value");
assert_eq!(val, *v);
}
decoder.set_data(buffer);
let mut values_read: Vec<i64> = vec![0; values.len()];
decoder
.get_batch(&mut values_read[..])
.expect("get_batch() should be OK");
assert_eq!(&values_read[..], values);
}
#[test]
fn test_rle_specific_sequences() {
let mut expected_buffer = Vec::new();
let mut values = vec![0; 50];
values.resize(100, 1);
expected_buffer.push(50 << 1);
expected_buffer.push(0);
expected_buffer.push(50 << 1);
expected_buffer.push(1);
for width in 1..9 {
validate_rle(&values[..], width, Some(&expected_buffer[..]), 4);
}
for width in 9..MAX_WIDTH + 1 {
validate_rle(
&values[..],
width as u8,
None,
2 * (1 + bit_util::ceil(width as i64, 8) as i32),
);
}
values.clear();
expected_buffer.clear();
for i in 0..101 {
values.push(i % 2);
}
let num_groups = bit_util::ceil(100, 8) as u8;
expected_buffer.push((num_groups << 1) | 1);
expected_buffer.resize(expected_buffer.len() + 100 / 8, 0b10101010);
expected_buffer.push(0b00001010);
validate_rle(
&values,
1,
Some(&expected_buffer[..]),
1 + num_groups as i32,
);
for width in 2..MAX_WIDTH + 1 {
let num_values = bit_util::ceil(100, 8) * 8;
validate_rle(
&values,
width as u8,
None,
1 + bit_util::ceil(width as i64 * num_values, 8) as i32,
);
}
}
fn test_rle_values(bit_width: usize, num_vals: usize, value: i32) {
let mod_val = if bit_width == 64 {
1
} else {
1u64 << bit_width
};
let mut values: Vec<i64> = vec![];
for v in 0..num_vals {
let val = if value == -1 {
v as i64 % mod_val as i64
} else {
value as i64
};
values.push(val);
}
validate_rle(&values, bit_width as u8, None, -1);
}
#[test]
fn test_values() {
for width in 1..MAX_WIDTH + 1 {
test_rle_values(width, 1, -1);
test_rle_values(width, 1024, -1);
test_rle_values(width, 1024, 0);
test_rle_values(width, 1024, 1);
}
}
#[test]
fn test_truncated_rle() {
let mut data: Vec<u8> = vec![
(3 << 1) | 1, ];
data.extend(std::iter::repeat(0xFF).take(20));
let data: Bytes = data.into();
let mut decoder = RleDecoder::new(8);
decoder.set_data(data.clone());
let mut output = vec![0_u16; 100];
let read = decoder.get_batch(&mut output).unwrap();
assert_eq!(read, 20);
assert!(output.iter().take(20).all(|x| *x == 255));
decoder.set_data(data);
let dict: Vec<u16> = (0..256).collect();
let mut output = vec![0_u16; 100];
let read = decoder
.get_batch_with_dict(&dict, &mut output, 100)
.unwrap();
assert_eq!(read, 20);
assert!(output.iter().take(20).all(|x| *x == 255));
}
#[test]
fn test_rle_padded() {
let values: Vec<i16> = vec![0, 1, 1, 3, 1, 0];
let bit_width = 2;
let buffer_len = RleEncoder::max_buffer_size(bit_width, values.len());
let mut encoder = RleEncoder::new(bit_width, buffer_len + 1);
for v in &values {
encoder.put(*v as u64)
}
let mut buffer = encoder.consume();
buffer.push(0);
let mut decoder = RleDecoder::new(bit_width);
decoder.set_data(buffer.into());
let mut actual_values: Vec<i16> = vec![0; 12];
let r = decoder
.get_batch(&mut actual_values)
.expect("get_batch() should be OK");
assert_eq!(r, 8);
assert_eq!(actual_values[..6], values);
assert_eq!(actual_values[6], 0);
assert_eq!(actual_values[7], 0);
}
#[test]
fn test_long_run() {
let mut writer = BitWriter::new(1024);
let bit_width = 1;
let num_values = 2002;
let run_bytes = ceil(num_values * bit_width, 8) as u64;
writer.put_vlq_int(run_bytes << 1 | 1);
for _ in 0..run_bytes {
writer.put_aligned(0xFF_u8, 1);
}
let buffer: Bytes = writer.consume().into();
let mut decoder = RleDecoder::new(1);
decoder.set_data(buffer.clone());
let mut decoded: Vec<i16> = vec![0; num_values];
let r = decoder.get_batch(&mut decoded).unwrap();
assert_eq!(r, num_values);
assert_eq!(vec![1; num_values], decoded);
decoder.set_data(buffer);
let r = decoder
.get_batch_with_dict(&[0, 23], &mut decoded, num_values)
.unwrap();
assert_eq!(r, num_values);
assert_eq!(vec![23; num_values], decoded);
}
#[test]
fn test_rle_specific_roundtrip() {
let bit_width = 1;
let values: Vec<i16> = vec![0, 1, 1, 1, 1, 0, 0, 0, 0, 1];
let buffer_len = RleEncoder::max_buffer_size(bit_width, values.len());
let mut encoder = RleEncoder::new(bit_width, buffer_len);
for v in &values {
encoder.put(*v as u64)
}
let buffer = encoder.consume();
let mut decoder = RleDecoder::new(bit_width);
decoder.set_data(Bytes::from(buffer));
let mut actual_values: Vec<i16> = vec![0; values.len()];
decoder
.get_batch(&mut actual_values)
.expect("get_batch() should be OK");
assert_eq!(actual_values, values);
}
fn test_round_trip(values: &[i32], bit_width: u8) {
let buffer_len = 64 * 1024;
let mut encoder = RleEncoder::new(bit_width, buffer_len);
for v in values {
encoder.put(*v as u64)
}
let buffer = Bytes::from(encoder.consume());
let mut decoder = RleDecoder::new(bit_width);
decoder.set_data(buffer.clone());
for v in values {
let val = decoder
.get::<i32>()
.expect("get() should be OK")
.expect("get() should return value");
assert_eq!(val, *v);
}
let mut decoder = RleDecoder::new(bit_width);
decoder.set_data(buffer);
let mut values_read: Vec<i32> = vec![0; values.len()];
decoder
.get_batch(&mut values_read[..])
.expect("get_batch() should be OK");
assert_eq!(&values_read[..], values);
}
#[test]
fn test_random() {
let seed_len = 32;
let niters = 50;
let ngroups = 1000;
let max_group_size = 15;
let mut values = vec![];
for _ in 0..niters {
values.clear();
let rng = thread_rng();
let seed_vec: Vec<u8> = rng.sample_iter::<u8, _>(&Standard).take(seed_len).collect();
let mut seed = [0u8; 32];
seed.copy_from_slice(&seed_vec[0..seed_len]);
let mut gen = rand::rngs::StdRng::from_seed(seed);
let mut parity = false;
for _ in 0..ngroups {
let mut group_size = gen.gen_range(1..20);
if group_size > max_group_size {
group_size = 1;
}
for _ in 0..group_size {
values.push(parity as i32);
}
parity = !parity;
}
let bit_width = bit_util::num_required_bits(values.len() as u64);
assert!(bit_width < 64);
test_round_trip(&values[..], bit_width);
}
}
}