winnow/binary/bits/mod.rs
1//! Bit level parsers
2//!
3
4#[cfg(test)]
5mod tests;
6
7use crate::combinator::trace;
8use crate::error::{ErrorConvert, Needed, ParserError};
9use crate::lib::std::ops::{AddAssign, Div, Shl, Shr};
10use crate::stream::{Stream, StreamIsPartial, ToUsize};
11use crate::{Parser, Result};
12
13/// Number of bits in a byte
14const BYTE: usize = u8::BITS as usize;
15
16/// Converts a byte-level input to a bit-level input
17///
18/// See [`bytes`] to convert it back.
19///
20/// # Example
21/// ```rust
22/// # use winnow::prelude::*;
23/// # use winnow::Bytes;
24/// # use winnow::binary::bits::{bits, take};
25/// # use winnow::error::ContextError;
26/// # use winnow::error::ErrMode;
27/// type Stream<'i> = &'i Bytes;
28///
29/// fn stream(b: &[u8]) -> Stream<'_> {
30/// Bytes::new(b)
31/// }
32///
33/// fn parse(input: &mut Stream<'_>) -> ModalResult<(u8, u8)> {
34/// bits::<_, _, ErrMode<ContextError>, _, _>((take(4usize), take(8usize))).parse_next(input)
35/// }
36///
37/// let input = stream(&[0x12, 0x34, 0xff, 0xff]);
38///
39/// let output = parse.parse_peek(input).expect("We take 1.5 bytes and the input is longer than 2 bytes");
40///
41/// // The first byte is consumed, the second byte is partially consumed and dropped.
42/// let remaining = output.0;
43/// assert_eq!(remaining, stream(&[0xff, 0xff]));
44///
45/// let parsed = output.1;
46/// assert_eq!(parsed.0, 0x01);
47/// assert_eq!(parsed.1, 0x23);
48/// ```
49pub fn bits<Input, Output, BitError, ByteError, ParseNext>(
50 mut parser: ParseNext,
51) -> impl Parser<Input, Output, ByteError>
52where
53 BitError: ParserError<(Input, usize)> + ErrorConvert<ByteError>,
54 ByteError: ParserError<Input>,
55 (Input, usize): Stream,
56 Input: Stream + Clone,
57 ParseNext: Parser<(Input, usize), Output, BitError>,
58{
59 trace("bits", move |input: &mut Input| {
60 let mut bit_input = (input.clone(), 0);
61 match parser.parse_next(&mut bit_input) {
62 Ok(result) => {
63 let (mut rest, offset) = bit_input;
64 // If the next byte has been partially read, it will be sliced away as well.
65 // The parser functions might already slice away all fully read bytes.
66 // That's why `offset / BYTE` isn't necessarily needed at all times.
67 let remaining_bytes_index = offset / BYTE + if offset % BYTE == 0 { 0 } else { 1 };
68 let _ = rest.next_slice(remaining_bytes_index);
69 *input = rest;
70 Ok(result)
71 }
72 Err(e) => match e.needed() {
73 Some(n) => Err(ParserError::incomplete(
74 input,
75 n.map(|u| u.get() / BYTE + 1),
76 )),
77 None => Err(ErrorConvert::convert(e)),
78 },
79 }
80 })
81}
82
83/// Convert a [`bits`] stream back into a byte stream
84///
85/// <div class="warning">
86///
87/// **Warning:** A partial byte remaining in the input will be ignored and the given parser will
88/// start parsing at the next full byte.
89///
90/// </div>
91///
92/// # Examples
93///
94/// ```
95/// # use winnow::prelude::*;
96/// # use winnow::Bytes;
97/// # use winnow::token::rest;
98/// # use winnow::error::ContextError;
99/// # use winnow::error::ErrMode;
100/// use winnow::binary::bits::{bits, bytes, take};
101///
102/// type Stream<'i> = &'i Bytes;
103///
104/// fn stream(b: &[u8]) -> Stream<'_> {
105/// Bytes::new(b)
106/// }
107///
108/// fn parse<'i>(input: &mut Stream<'i>) -> ModalResult<(u8, u8, &'i [u8])> {
109/// bits::<_, _, ErrMode<ContextError>, _, _>((
110/// take(4usize),
111/// take(8usize),
112/// bytes::<_, _, ErrMode<ContextError>, _, _>(rest)
113/// )).parse_next(input)
114/// }
115///
116/// let input = stream(&[0x12, 0x34, 0xff, 0xff]);
117///
118/// assert_eq!(parse.parse_peek(input), Ok(( stream(&[]), (0x01, 0x23, &[0xff, 0xff][..]) )));
119/// ```
120pub fn bytes<Input, Output, ByteError, BitError, ParseNext>(
121 mut parser: ParseNext,
122) -> impl Parser<(Input, usize), Output, BitError>
123where
124 ByteError: ParserError<Input> + ErrorConvert<BitError>,
125 BitError: ParserError<(Input, usize)>,
126 Input: Stream<Token = u8> + Clone,
127 ParseNext: Parser<Input, Output, ByteError>,
128{
129 trace("bytes", move |bit_input: &mut (Input, usize)| {
130 let (mut input, offset) = bit_input.clone();
131 let _ = if offset % BYTE != 0 {
132 input.next_slice(1 + offset / BYTE)
133 } else {
134 input.next_slice(offset / BYTE)
135 };
136 match parser.parse_next(&mut input) {
137 Ok(res) => {
138 *bit_input = (input, 0);
139 Ok(res)
140 }
141 Err(e) => match e.needed() {
142 Some(Needed::Unknown) => Err(ParserError::incomplete(bit_input, Needed::Unknown)),
143 Some(Needed::Size(sz)) => Err(match sz.get().checked_mul(BYTE) {
144 Some(v) => ParserError::incomplete(bit_input, Needed::new(v)),
145 None => ParserError::assert(
146 bit_input,
147 "overflow in turning needed bytes into needed bits",
148 ),
149 }),
150 None => Err(ErrorConvert::convert(e)),
151 },
152 }
153 })
154}
155
156/// Parse taking `count` bits
157///
158/// # Effective Signature
159///
160/// Assuming you are parsing a `(&[u8], usize)` bit [Stream]:
161/// ```rust
162/// # use winnow::prelude::*;;
163/// # use winnow::error::ContextError;
164/// pub fn take<'i>(count: usize) -> impl Parser<(&'i [u8], usize), u8, ContextError>
165/// # {
166/// # winnow::binary::bits::take(count)
167/// # }
168/// ```
169///
170/// # Example
171/// ```rust
172/// # use winnow::prelude::*;
173/// # use winnow::Bytes;
174/// # use winnow::error::ContextError;
175/// use winnow::binary::bits::take;
176///
177/// type Stream<'i> = &'i Bytes;
178///
179/// fn stream(b: &[u8]) -> Stream<'_> {
180/// Bytes::new(b)
181/// }
182///
183/// // Consumes 0 bits, returns 0
184/// assert_eq!(take::<_, usize, _, ContextError>(0usize).parse_peek((stream(&[0b00010010]), 0)), Ok(((stream(&[0b00010010]), 0), 0)));
185///
186/// // Consumes 4 bits, returns their values and increase offset to 4
187/// assert_eq!(take::<_, usize, _, ContextError>(4usize).parse_peek((stream(&[0b00010010]), 0)), Ok(((stream(&[0b00010010]), 4), 0b00000001)));
188///
189/// // Consumes 4 bits, offset is 4, returns their values and increase offset to 0 of next byte
190/// assert_eq!(take::<_, usize, _, ContextError>(4usize).parse_peek((stream(&[0b00010010]), 4)), Ok(((stream(&[]), 0), 0b00000010)));
191///
192/// // Tries to consume 12 bits but only 8 are available
193/// assert!(take::<_, usize, _, ContextError>(12usize).parse_peek((stream(&[0b00010010]), 0)).is_err());
194/// ```
195#[inline(always)]
196pub fn take<Input, Output, Count, Error>(count: Count) -> impl Parser<(Input, usize), Output, Error>
197where
198 Input: Stream<Token = u8> + StreamIsPartial + Clone,
199 Output: From<u8> + AddAssign + Shl<usize, Output = Output> + Shr<usize, Output = Output>,
200 Count: ToUsize,
201 Error: ParserError<(Input, usize)>,
202{
203 let count = count.to_usize();
204 trace("take", move |input: &mut (Input, usize)| {
205 if <Input as StreamIsPartial>::is_partial_supported() {
206 take_::<_, _, _, true>(input, count)
207 } else {
208 take_::<_, _, _, false>(input, count)
209 }
210 })
211}
212
213fn take_<I, O, E: ParserError<(I, usize)>, const PARTIAL: bool>(
214 bit_input: &mut (I, usize),
215 count: usize,
216) -> Result<O, E>
217where
218 I: StreamIsPartial,
219 I: Stream<Token = u8> + Clone,
220 O: From<u8> + AddAssign + Shl<usize, Output = O> + Shr<usize, Output = O>,
221{
222 if count == 0 {
223 Ok(0u8.into())
224 } else {
225 let (mut input, bit_offset) = bit_input.clone();
226 if input.eof_offset() * BYTE < count + bit_offset {
227 if PARTIAL && input.is_partial() {
228 Err(ParserError::incomplete(bit_input, Needed::new(count)))
229 } else {
230 Err(ParserError::from_input(&(input, bit_offset)))
231 }
232 } else {
233 let cnt = (count + bit_offset).div(BYTE);
234 let mut acc: O = 0_u8.into();
235 let mut offset: usize = bit_offset;
236 let mut remaining: usize = count;
237 let mut end_offset: usize = 0;
238
239 for (_, byte) in input.iter_offsets().take(cnt + 1) {
240 if remaining == 0 {
241 break;
242 }
243 let val: O = if offset == 0 {
244 byte.into()
245 } else {
246 (byte << offset >> offset).into()
247 };
248
249 if remaining < BYTE - offset {
250 acc += val >> (BYTE - offset - remaining);
251 end_offset = remaining + offset;
252 break;
253 } else {
254 acc += val << (remaining - (BYTE - offset));
255 remaining -= BYTE - offset;
256 offset = 0;
257 }
258 }
259 let _ = input.next_slice(cnt);
260 *bit_input = (input, end_offset);
261 Ok(acc)
262 }
263 }
264}
265
266/// Parse taking `count` bits and comparing them to `pattern`
267///
268/// # Effective Signature
269///
270/// Assuming you are parsing a `(&[u8], usize)` bit [Stream]:
271/// ```rust
272/// # use winnow::prelude::*;;
273/// # use winnow::error::ContextError;
274/// pub fn pattern<'i>(pattern: u8, count: usize) -> impl Parser<(&'i [u8], usize), u8, ContextError>
275/// # {
276/// # winnow::binary::bits::pattern(pattern, count)
277/// # }
278/// ```
279///
280/// # Example
281///
282/// ```rust
283/// # use winnow::prelude::*;
284/// # use winnow::Bytes;
285/// # use winnow::error::ContextError;
286/// use winnow::binary::bits::pattern;
287///
288/// type Stream<'i> = &'i Bytes;
289///
290/// fn stream(b: &[u8]) -> Stream<'_> {
291/// Bytes::new(b)
292/// }
293///
294/// /// Compare the lowest `count` bits of `input` against the lowest `count` bits of `pattern`.
295/// /// Return Ok and the matching section of `input` if there's a match.
296/// /// Return Err if there's no match.
297/// fn parser(bits: u8, count: u8, input: &mut (Stream<'_>, usize)) -> ModalResult<u8> {
298/// pattern(bits, count).parse_next(input)
299/// }
300///
301/// // The lowest 4 bits of 0b00001111 match the lowest 4 bits of 0b11111111.
302/// assert_eq!(
303/// pattern::<_, usize, _, ContextError>(0b0000_1111, 4usize).parse_peek((stream(&[0b1111_1111]), 0)),
304/// Ok(((stream(&[0b1111_1111]), 4), 0b0000_1111))
305/// );
306///
307/// // The lowest bit of 0b00001111 matches the lowest bit of 0b11111111 (both are 1).
308/// assert_eq!(
309/// pattern::<_, usize, _, ContextError>(0b00000001, 1usize).parse_peek((stream(&[0b11111111]), 0)),
310/// Ok(((stream(&[0b11111111]), 1), 0b00000001))
311/// );
312///
313/// // The lowest 2 bits of 0b11111111 and 0b00000001 are different.
314/// assert!(pattern::<_, usize, _, ContextError>(0b000000_01, 2usize).parse_peek((stream(&[0b111111_11]), 0)).is_err());
315///
316/// // The lowest 8 bits of 0b11111111 and 0b11111110 are different.
317/// assert!(pattern::<_, usize, _, ContextError>(0b11111110, 8usize).parse_peek((stream(&[0b11111111]), 0)).is_err());
318/// ```
319#[inline(always)]
320#[doc(alias = "literal")]
321#[doc(alias = "just")]
322#[doc(alias = "tag")]
323pub fn pattern<Input, Output, Count, Error: ParserError<(Input, usize)>>(
324 pattern: Output,
325 count: Count,
326) -> impl Parser<(Input, usize), Output, Error>
327where
328 Input: Stream<Token = u8> + StreamIsPartial + Clone,
329 Count: ToUsize,
330 Output: From<u8>
331 + AddAssign
332 + Shl<usize, Output = Output>
333 + Shr<usize, Output = Output>
334 + PartialEq,
335{
336 let count = count.to_usize();
337 trace("pattern", move |input: &mut (Input, usize)| {
338 let start = input.checkpoint();
339
340 take(count).parse_next(input).and_then(|o| {
341 if pattern == o {
342 Ok(o)
343 } else {
344 input.reset(&start);
345 Err(ParserError::from_input(input))
346 }
347 })
348 })
349}
350
351/// Parses one specific bit as a bool.
352///
353/// # Effective Signature
354///
355/// Assuming you are parsing a `(&[u8], usize)` bit [Stream]:
356/// ```rust
357/// # use winnow::prelude::*;;
358/// # use winnow::error::ContextError;
359/// pub fn bool(input: &mut (&[u8], usize)) -> ModalResult<bool>
360/// # {
361/// # winnow::binary::bits::bool.parse_next(input)
362/// # }
363/// ```
364///
365/// # Example
366///
367/// ```rust
368/// # use winnow::prelude::*;
369/// # use winnow::Bytes;
370/// # use winnow::error::InputError;
371/// use winnow::binary::bits::bool;
372///
373/// type Stream<'i> = &'i Bytes;
374///
375/// fn stream(b: &[u8]) -> Stream<'_> {
376/// Bytes::new(b)
377/// }
378///
379/// fn parse(input: &mut (Stream<'_>, usize)) -> ModalResult<bool> {
380/// bool.parse_next(input)
381/// }
382///
383/// assert_eq!(parse.parse_peek((stream(&[0b10000000]), 0)), Ok(((stream(&[0b10000000]), 1), true)));
384/// assert_eq!(parse.parse_peek((stream(&[0b10000000]), 1)), Ok(((stream(&[0b10000000]), 2), false)));
385/// ```
386#[doc(alias = "any")]
387pub fn bool<Input, Error: ParserError<(Input, usize)>>(
388 input: &mut (Input, usize),
389) -> Result<bool, Error>
390where
391 Input: Stream<Token = u8> + StreamIsPartial + Clone,
392{
393 trace("bool", |input: &mut (Input, usize)| {
394 let bit: u32 = take(1usize).parse_next(input)?;
395 Ok(bit != 0)
396 })
397 .parse_next(input)
398}