spinoso_string/enc/binary/
codepoints.rs1use core::slice;
2
3#[derive(Debug, Clone)]
4pub struct Codepoints<'a> {
5 inner: slice::Iter<'a, u8>,
6}
7
8impl<'a> Codepoints<'a> {
9 #[inline]
10 pub fn new(bytes: &'a [u8]) -> Self {
11 Self { inner: bytes.iter() }
12 }
13}
14
15impl Iterator for Codepoints<'_> {
16 type Item = u32;
17
18 fn next(&mut self) -> Option<Self::Item> {
19 self.inner.next().map(|&b| u32::from(b))
20 }
21}
22
23impl Default for Codepoints<'_> {
24 #[inline]
25 fn default() -> Self {
26 Self::new(b"")
27 }
28}
29
30#[cfg(test)]
31mod tests {
32 use alloc::vec::Vec;
33
34 use super::*;
35 use crate::enc::binary::BinaryString;
36
37 #[test]
38 fn test_valid_ascii() {
39 let s = BinaryString::from("abc");
40 let codepoints = Codepoints::new(&s);
41 assert_eq!(codepoints.collect::<Vec<_>>(), &[97, 98, 99]);
42 }
43
44 #[test]
45 fn test_utf8_interpreted_as_bytes() {
46 let s = BinaryString::from("abc💎");
47 let codepoints = Codepoints::new(&s);
48 assert_eq!(codepoints.collect::<Vec<_>>(), &[97, 98, 99, 240, 159, 146, 142]);
49 }
50
51 #[test]
52 fn test_invalid_utf8_interpreted_as_bytes() {
53 let s = BinaryString::from(b"abc\xFF");
54 let codepoints = Codepoints::new(&s);
55 assert_eq!(codepoints.collect::<Vec<_>>(), &[97, 98, 99, 255]);
56 }
57}