spinoso_string/enc/binary/
codepoints.rs

1use core::slice;
2
3#[derive(Debug, Clone)]
4pub struct Codepoints<'a> {
5    inner: slice::Iter<'a, u8>,
6}
7
8impl<'a> Codepoints<'a> {
9    #[inline]
10    pub fn new(bytes: &'a [u8]) -> Self {
11        Self { inner: bytes.iter() }
12    }
13}
14
15impl Iterator for Codepoints<'_> {
16    type Item = u32;
17
18    fn next(&mut self) -> Option<Self::Item> {
19        self.inner.next().map(|&b| u32::from(b))
20    }
21}
22
23impl Default for Codepoints<'_> {
24    #[inline]
25    fn default() -> Self {
26        Self::new(b"")
27    }
28}
29
30#[cfg(test)]
31mod tests {
32    use alloc::vec::Vec;
33
34    use super::*;
35    use crate::enc::binary::BinaryString;
36
37    #[test]
38    fn test_valid_ascii() {
39        let s = BinaryString::from("abc");
40        let codepoints = Codepoints::new(&s);
41        assert_eq!(codepoints.collect::<Vec<_>>(), &[97, 98, 99]);
42    }
43
44    #[test]
45    fn test_utf8_interpreted_as_bytes() {
46        let s = BinaryString::from("abc💎");
47        let codepoints = Codepoints::new(&s);
48        assert_eq!(codepoints.collect::<Vec<_>>(), &[97, 98, 99, 240, 159, 146, 142]);
49    }
50
51    #[test]
52    fn test_invalid_utf8_interpreted_as_bytes() {
53        let s = BinaryString::from(b"abc\xFF");
54        let codepoints = Codepoints::new(&s);
55        assert_eq!(codepoints.collect::<Vec<_>>(), &[97, 98, 99, 255]);
56    }
57}