Struct regex_automata::dfa::sparse::DFA

source · [−]

pub struct DFA<T> { /* private fields */ }

Expand description

A sparse deterministic finite automaton (DFA) with variable sized states.

In contrast to a dense::DFA, a sparse DFA uses a more space efficient representation for its transitions. Consequently, sparse DFAs may use much less memory than dense DFAs, but this comes at a price. In particular, reading the more space efficient transitions takes more work, and consequently, searching using a sparse DFA is typically slower than a dense DFA.

A sparse DFA can be built using the default configuration via the DFA::new constructor. Otherwise, one can configure various aspects of a dense DFA via dense::Builder, and then convert a dense DFA to a sparse DFA using dense::DFA::to_sparse.

In general, a sparse DFA supports all the same search operations as a dense DFA.

Making the choice between a dense and sparse DFA depends on your specific workload. If you can sacrifice a bit of search time performance, then a sparse DFA might be the best choice. In particular, while sparse DFAs are probably always slower than dense DFAs, you may find that they are easily fast enough for your purposes!

Type parameters

A DFA has one type parameter, T, which is used to represent the parts of a sparse DFA. T is typically a Vec<u8> or a &[u8].

The `Automaton` trait

This type implements the Automaton trait, which means it can be used for searching. For example:

use regex_automata::{
    dfa::{Automaton, sparse::DFA},
    HalfMatch,
};

let dfa = DFA::new("foo[0-9]+")?;
let expected = HalfMatch::must(0, 8);
assert_eq!(Some(expected), dfa.find_leftmost_fwd(b"foo12345")?);

Struct regex_automata::dfa::sparse::DFA

Implementations

impl DFA<Vec<u8>>

pub fn new(pattern: &str) -> Result<DFA<Vec<u8>>, Error>

pub fn new_many<P: AsRef<str>>(patterns: &[P]) -> Result<DFA<Vec<u8>>, Error>

impl DFA<Vec<u8>>

pub fn always_match() -> Result<DFA<Vec<u8>>, Error>

pub fn never_match() -> Result<DFA<Vec<u8>>, Error>

impl<T: AsRef<[u8]>> DFA<T>

pub fn as_ref<'a>(&'a self) -> DFA<&'a [u8]>

pub fn to_owned(&self) -> DFA<Vec<u8>>

pub fn memory_usage(&self) -> usize

pub fn has_starts_for_each_pattern(&self) -> bool

impl<T: AsRef<[u8]>> DFA<T>

pub fn to_bytes_little_endian(&self) -> Vec<u8>
Notable traits for Vec<u8, A>: impl<A> Write for Vec<u8, A> where A: Allocator

pub fn to_bytes_big_endian(&self) -> Vec<u8>
Notable traits for Vec<u8, A>: impl<A> Write for Vec<u8, A> where A: Allocator

pub fn to_bytes_native_endian(&self) -> Vec<u8>
Notable traits for Vec<u8, A>: impl<A> Write for Vec<u8, A> where A: Allocator

pub fn write_to_little_endian(&self, dst: &mut [u8]) -> Result<usize, SerializeError>

pub fn write_to_big_endian(&self, dst: &mut [u8]) -> Result<usize, SerializeError>

pub fn write_to_native_endian(&self, dst: &mut [u8]) -> Result<usize, SerializeError>

pub fn write_to_len(&self) -> usize

impl<'a> DFA<&'a [u8]>

pub fn from_bytes(slice: &'a [u8]) -> Result<(DFA<&'a [u8]>, usize), DeserializeError>

pub unsafe fn from_bytes_unchecked(slice: &'a [u8]) -> Result<(DFA<&'a [u8]>, usize), DeserializeError>

Trait Implementations

impl<T: AsRef<[u8]>> Automaton for DFA<T>

fn is_special_state(&self, id: StateID) -> bool

fn is_dead_state(&self, id: StateID) -> bool

fn is_quit_state(&self, id: StateID) -> bool

fn is_match_state(&self, id: StateID) -> bool

fn is_start_state(&self, id: StateID) -> bool

fn is_accel_state(&self, id: StateID) -> bool

fn next_state(&self, current: StateID, input: u8) -> StateID

unsafe fn next_state_unchecked(&self, current: StateID, input: u8) -> StateID

fn next_eoi_state(&self, current: StateID) -> StateID

fn pattern_count(&self) -> usize

fn match_count(&self, id: StateID) -> usize

fn match_pattern(&self, id: StateID, match_index: usize) -> PatternID

fn start_state_forward(&self, pattern_id: Option<PatternID>, bytes: &[u8], start: usize, end: usize) -> StateID

fn start_state_reverse(&self, pattern_id: Option<PatternID>, bytes: &[u8], start: usize, end: usize) -> StateID

fn accelerator(&self, id: StateID) -> &[u8]
Notable traits for &'_ mut [u8]: impl<'_> Write for &'_ mut [u8]; impl<'_> Read for &'_ [u8]

fn find_earliest_fwd(&self, bytes: &[u8]) -> Result<Option<HalfMatch>, MatchError>

fn find_earliest_rev(&self, bytes: &[u8]) -> Result<Option<HalfMatch>, MatchError>

fn find_leftmost_fwd(&self, bytes: &[u8]) -> Result<Option<HalfMatch>, MatchError>

fn find_leftmost_rev(&self, bytes: &[u8]) -> Result<Option<HalfMatch>, MatchError>

fn find_overlapping_fwd(&self, bytes: &[u8], state: &mut OverlappingState) -> Result<Option<HalfMatch>, MatchError>

fn find_earliest_fwd_at(&self, pre: Option<&mut Scanner<'_>>, pattern_id: Option<PatternID>, bytes: &[u8], start: usize, end: usize) -> Result<Option<HalfMatch>, MatchError>

fn find_earliest_rev_at(&self, pattern_id: Option<PatternID>, bytes: &[u8], start: usize, end: usize) -> Result<Option<HalfMatch>, MatchError>

fn find_leftmost_fwd_at(&self, pre: Option<&mut Scanner<'_>>, pattern_id: Option<PatternID>, bytes: &[u8], start: usize, end: usize) -> Result<Option<HalfMatch>, MatchError>

fn find_leftmost_rev_at(&self, pattern_id: Option<PatternID>, bytes: &[u8], start: usize, end: usize) -> Result<Option<HalfMatch>, MatchError>

fn find_overlapping_fwd_at(&self, pre: Option<&mut Scanner<'_>>, pattern_id: Option<PatternID>, bytes: &[u8], start: usize, end: usize, state: &mut OverlappingState) -> Result<Option<HalfMatch>, MatchError>

impl<T: Clone> Clone for DFA<T>

fn clone(&self) -> DFA<T>

fn clone_from(&mut self, source: &Self)

impl<T: AsRef<[u8]>> Debug for DFA<T>

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations

impl<T> RefUnwindSafe for DFA<T> where T: RefUnwindSafe,

impl<T> Send for DFA<T> where T: Send,

impl<T> Sync for DFA<T> where T: Sync,

impl<T> Unpin for DFA<T> where T: Unpin,

impl<T> UnwindSafe for DFA<T> where T: UnwindSafe,

Blanket Implementations

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T: AsRef<[u8]>> DFA<T>

pub fn as_ref<'a>(&'a self) -> DFA<&'a [u8]>

impl<T: AsRef<[u8]>> DFA<T>

pub fn to_bytes_little_endian(&self) -> Vec<u8>
Notable traits for Vec<u8, A>: impl<A> Write for Vec<u8, A> where A: Allocator

pub fn to_bytes_big_endian(&self) -> Vec<u8>
Notable traits for Vec<u8, A>: impl<A> Write for Vec<u8, A> where A: Allocator

pub fn to_bytes_native_endian(&self) -> Vec<u8>
Notable traits for Vec<u8, A>: impl<A> Write for Vec<u8, A> where A: Allocator

pub fn write_to_little_endian(
    &self,
    dst: &mut [u8]
) -> Result<usize, SerializeError>

pub fn write_to_big_endian(
    &self,
    dst: &mut [u8]
) -> Result<usize, SerializeError>

pub fn write_to_native_endian(
    &self,
    dst: &mut [u8]
) -> Result<usize, SerializeError>

impl<'a> DFA<&'a [u8]>

pub fn from_bytes(
    slice: &'a [u8]
) -> Result<(DFA<&'a [u8]>, usize), DeserializeError>

pub unsafe fn from_bytes_unchecked(
    slice: &'a [u8]
) -> Result<(DFA<&'a [u8]>, usize), DeserializeError>

impl<T: AsRef<[u8]>> Automaton for DFA<T>

fn start_state_forward(
    &self,
    pattern_id: Option<PatternID>,
    bytes: &[u8],
    start: usize,
    end: usize
) -> StateID

fn start_state_reverse(
    &self,
    pattern_id: Option<PatternID>,
    bytes: &[u8],
    start: usize,
    end: usize
) -> StateID

fn accelerator(&self, id: StateID) -> &[u8]
Notable traits for &'_ mut [u8]: impl<'_> Write for &'_ mut [u8]; impl<'_> Read for &'_ [u8]

fn find_earliest_fwd(
    &self,
    bytes: &[u8]
) -> Result<Option<HalfMatch>, MatchError>

fn find_earliest_rev(
    &self,
    bytes: &[u8]
) -> Result<Option<HalfMatch>, MatchError>

fn find_leftmost_fwd(
    &self,
    bytes: &[u8]
) -> Result<Option<HalfMatch>, MatchError>

fn find_leftmost_rev(
    &self,
    bytes: &[u8]
) -> Result<Option<HalfMatch>, MatchError>

fn find_overlapping_fwd(
    &self,
    bytes: &[u8],
    state: &mut OverlappingState
) -> Result<Option<HalfMatch>, MatchError>

fn find_earliest_fwd_at(
    &self,
    pre: Option<&mut Scanner<'_>>,
    pattern_id: Option<PatternID>,
    bytes: &[u8],
    start: usize,
    end: usize
) -> Result<Option<HalfMatch>, MatchError>

fn find_earliest_rev_at(
    &self,
    pattern_id: Option<PatternID>,
    bytes: &[u8],
    start: usize,
    end: usize
) -> Result<Option<HalfMatch>, MatchError>

fn find_leftmost_fwd_at(
    &self,
    pre: Option<&mut Scanner<'_>>,
    pattern_id: Option<PatternID>,
    bytes: &[u8],
    start: usize,
    end: usize
) -> Result<Option<HalfMatch>, MatchError>

fn find_leftmost_rev_at(
    &self,
    pattern_id: Option<PatternID>,
    bytes: &[u8],
    start: usize,
    end: usize
) -> Result<Option<HalfMatch>, MatchError>

fn find_overlapping_fwd_at(
    &self,
    pre: Option<&mut Scanner<'_>>,
    pattern_id: Option<PatternID>,
    bytes: &[u8],
    start: usize,
    end: usize,
    state: &mut OverlappingState
) -> Result<Option<HalfMatch>, MatchError>

impl<T: AsRef<[u8]>> Debug for DFA<T>

impl<T> RefUnwindSafe for DFA<T> where
T: RefUnwindSafe,

impl<T> Send for DFA<T> where
T: Send,

impl<T> Sync for DFA<T> where
T: Sync,

impl<T> Unpin for DFA<T> where
T: Unpin,

impl<T> UnwindSafe for DFA<T> where
T: UnwindSafe,

impl<T> Any for T where
T: 'static + ?Sized,

impl<T> Borrow<T> for T where
T: ?Sized,

impl<T> BorrowMut<T> for T where
T: ?Sized,

impl<T, U> Into<U> for T where
U: From<T>,

impl<T> ToOwned for T where
T: Clone,

impl<T, U> TryFrom<U> for T where
U: Into<T>,

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,