artichoke_backend/extn/core/regexp/backend/
mod.rs

1use std::collections::HashMap;
2use std::fmt;
3use std::hash::{Hash, Hasher};
4
5use crate::extn::core::regexp::{Config, Encoding, Source};
6use crate::extn::prelude::*;
7
8#[cfg(feature = "core-regexp-oniguruma")]
9pub mod onig;
10pub mod regex;
11
12pub type NilableString = Option<Vec<u8>>;
13pub type NameToCaptureLocations = Vec<(Vec<u8>, Vec<usize>)>;
14
15#[derive(Debug, Clone, Hash, PartialEq, Eq, PartialOrd, Ord)]
16pub enum Scan {
17    Collected(Vec<Vec<Option<Vec<u8>>>>),
18    Patterns(Vec<Vec<u8>>),
19    Haystack,
20}
21
22impl TryConvertMut<Scan, Option<Value>> for Artichoke {
23    type Error = Error;
24
25    fn try_convert_mut(&mut self, from: Scan) -> Result<Option<Value>, Self::Error> {
26        match from {
27            Scan::Collected(collected) => {
28                let ary = self.try_convert_mut(collected)?;
29                Ok(Some(ary))
30            }
31            Scan::Patterns(patterns) => {
32                let ary = self.try_convert_mut(patterns)?;
33                Ok(Some(ary))
34            }
35            Scan::Haystack => Ok(None),
36        }
37    }
38}
39
40pub trait RegexpType {
41    fn box_clone(&self) -> Box<dyn RegexpType>;
42
43    fn debug(&self) -> String;
44
45    fn source(&self) -> &Source;
46
47    fn config(&self) -> &Config;
48
49    fn encoding(&self) -> &Encoding;
50
51    fn inspect(&self) -> Vec<u8>;
52
53    fn string(&self) -> &[u8];
54
55    fn captures(&self, haystack: &[u8]) -> Result<Option<Vec<NilableString>>, Error>;
56
57    fn capture_indexes_for_name(&self, name: &[u8]) -> Result<Option<Vec<usize>>, Error>;
58
59    fn captures_len(&self, haystack: Option<&[u8]>) -> Result<usize, Error>;
60
61    fn capture0<'a>(&self, haystack: &'a [u8]) -> Result<Option<&'a [u8]>, Error>;
62
63    fn case_match(&self, interp: &mut Artichoke, haystack: &[u8]) -> Result<bool, Error>;
64
65    fn is_match(&self, haystack: &[u8], pos: Option<i64>) -> Result<bool, Error>;
66
67    fn match_(
68        &self,
69        interp: &mut Artichoke,
70        haystack: &[u8],
71        pos: Option<i64>,
72        block: Option<Block>,
73    ) -> Result<Value, Error>;
74
75    fn match_operator(&self, interp: &mut Artichoke, haystack: &[u8]) -> Result<Option<usize>, Error>;
76
77    fn named_captures(&self) -> Result<NameToCaptureLocations, Error>;
78
79    fn named_captures_for_haystack(&self, haystack: &[u8]) -> Result<Option<HashMap<Vec<u8>, NilableString>>, Error>;
80
81    fn names(&self) -> Vec<Vec<u8>>;
82
83    fn pos(&self, haystack: &[u8], at: usize) -> Result<Option<(usize, usize)>, Error>;
84
85    fn scan(&self, interp: &mut Artichoke, haystack: &[u8], block: Option<Block>) -> Result<Scan, Error>;
86}
87
88impl Clone for Box<dyn RegexpType> {
89    #[inline]
90    fn clone(&self) -> Self {
91        self.box_clone()
92    }
93}
94
95impl fmt::Debug for Box<dyn RegexpType> {
96    #[inline]
97    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
98        fmt::Debug::fmt(&self.as_ref(), f)
99    }
100}
101
102impl Hash for Box<dyn RegexpType> {
103    #[inline]
104    fn hash<H: Hasher>(&self, state: &mut H) {
105        Hash::hash(&self.as_ref(), state);
106    }
107}
108
109impl PartialEq for Box<dyn RegexpType> {
110    #[inline]
111    fn eq(&self, other: &Self) -> bool {
112        PartialEq::eq(&self.as_ref(), &other.as_ref())
113    }
114}
115
116impl Eq for Box<dyn RegexpType> {}
117
118impl fmt::Debug for &dyn RegexpType {
119    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
120        f.write_str(&self.debug())
121    }
122}
123
124impl Hash for &dyn RegexpType {
125    fn hash<H: Hasher>(&self, state: &mut H) {
126        self.source().hash(state);
127    }
128}
129
130impl PartialEq for &dyn RegexpType {
131    fn eq(&self, other: &Self) -> bool {
132        self.config().pattern() == other.config().pattern() && self.encoding() == other.encoding()
133    }
134}
135
136impl Eq for &dyn RegexpType {}