1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
use crate::encoding::ceil8;
use crate::read::levels::get_bit_width;
use super::super::bitpacking;
use super::super::uleb128;
use super::super::zigzag_leb128;
pub fn encode<I: Iterator<Item = i64>>(mut iterator: I, buffer: &mut Vec<u8>) {
let block_size = 128;
let mini_blocks = 1;
let mut container = [0u8; 10];
let encoded_len = uleb128::encode(block_size, &mut container);
buffer.extend_from_slice(&container[..encoded_len]);
let encoded_len = uleb128::encode(mini_blocks, &mut container);
buffer.extend_from_slice(&container[..encoded_len]);
let length = iterator.size_hint().1.unwrap();
let encoded_len = uleb128::encode(length as u64, &mut container);
buffer.extend_from_slice(&container[..encoded_len]);
let mut values = [0i64; 128];
let mut deltas = [0u32; 128];
let first_value = iterator.next().unwrap().into();
let (container, encoded_len) = zigzag_leb128::encode(first_value);
buffer.extend_from_slice(&container[..encoded_len]);
let mut prev = first_value;
let mut length = iterator.size_hint().1.unwrap();
while length != 0 {
for (i, v) in (0..128).zip(&mut iterator) {
let v: i64 = v.into();
values[i] = v - prev;
prev = v;
}
let consumed = std::cmp::min(length - iterator.size_hint().1.unwrap(), 128);
let values = &values[..consumed];
let min_delta = *values.iter().min().unwrap();
let max_delta = *values.iter().max().unwrap();
values.iter().zip(deltas.iter_mut()).for_each(|(v, d)| {
*d = (v - min_delta) as u32;
});
let (container, encoded_len) = zigzag_leb128::encode(min_delta);
buffer.extend_from_slice(&container[..encoded_len]);
let num_bits = get_bit_width((max_delta - min_delta) as i16) as u8;
buffer.push(num_bits);
if num_bits > 0 {
let start = buffer.len();
let bytes_needed = start + ceil8(deltas.len() * num_bits as usize);
buffer.resize(bytes_needed, 0);
bitpacking::encode(deltas.as_ref(), num_bits, &mut buffer[start..]);
let bytes_needed = start + ceil8(deltas.len() * num_bits as usize);
buffer.truncate(bytes_needed);
}
length = iterator.size_hint().1.unwrap();
}
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn constant_delta() {
let data = 1..=5;
let expected = vec![128u8, 1, 1, 5, 2, 2, 0];
let mut buffer = vec![];
encode(data, &mut buffer);
assert_eq!(expected, buffer);
}
#[test]
fn negative_min_delta() {
let data = vec![1, 2, 3, 4, 5, 1];
let mut expected = vec![128u8, 1, 1, 6, 2, 7, 3, 0b01101101, 0b00001011];
expected.extend(std::iter::repeat(0).take(128 * 3 / 8 - 2));
let mut buffer = vec![];
encode(data.into_iter(), &mut buffer);
assert_eq!(expected, buffer);
}
}