Struct utf8_ranges::Utf8Sequences [−] [src]

pub struct Utf8Sequences {
    // some fields omitted
}

[−]

An iterator over ranges of matching UTF-8 byte sequences.

The iteration represents an alternation of comprehensive byte sequences that match precisely the set of UTF-8 encoded scalar values in the range given.

A byte sequence corresponds to one of the scalar values in the range given if and only if it completely matches exactly one of the sequences of byte ranges produced by this iterator.

Each sequence of byte ranges matches a unique set of bytes. That is, no two sequences will match the same bytes.

Example

This shows how to match an arbitrary byte sequence against a range of scalar values.

use utf8_ranges::{Utf8Sequences, Utf8Sequence};

fn matches(seqs: &[Utf8Sequence], bytes: &[u8]) -> bool {
    for range in seqs {
        if range.matches(bytes) {
            return true;
        }
    }
    false
}

// Test the Basic Multilingual Plane (BMP).
let seqs: Vec<_> = Utf8Sequences::new('\u{0}', '\u{FFFF}').collect();

// UTF-8 encoding of 'a'.
assert!(matches(&seqs, &[0x61]));
// UTF-8 encoding of '☃' (`\u{2603}`).
assert!(matches(&seqs, &[0xE2, 0x98, 0x83]));
// UTF-8 encoding of `\u{10348}` (outside the BMP).
assert!(!matches(&seqs, &[0xF0, 0x90, 0x8D, 0x88]));
// Tries to match against a UTF-8 encoding of a surrogate codepoint,
// which is invalid UTF-8, and therefore fails, despite the fact that
// the corresponding codepoint (0xD800) falls in the range given.
assert!(!matches(&seqs, &[0xED, 0xA0, 0x80]));
// And fails against plain old invalid UTF-8.
assert!(!matches(&seqs, &[0xFF, 0xFF]));

If this example seems circuitous, that's because it is! It's meant to be illustrative. In practice, you could just try to decode your byte sequence and compare it with the scalar value range directly. However, this is not always possible (for example, in a byte-based automaton).

Methods

`impl Utf8Sequences`

`fn new(start: char, end: char) -> Self`[−]

Create a new iterator over UTF-8 byte ranges for the scalar value range given.

Trait Implementations

`impl Iterator for Utf8Sequences`

`type Item = Utf8Sequence`

`fn next(&mut self) -> Option<Self::Item>`

`fn size_hint(&self) -> (usize, Option<usize>)`

`fn count(self) -> usize`

`fn last(self) -> Option<Self::Item>`

`fn nth(&mut self, n: usize) -> Option<Self::Item>`

`fn chain<U>(self, other: U) -> Chain<Self, U::IntoIter> where U: IntoIterator<Item=Self::Item>`

`fn zip<U>(self, other: U) -> Zip<Self, U::IntoIter> where U: IntoIterator`

`fn map<B, F>(self, f: F) -> Map<Self, F> where F: FnMut(Self::Item) -> B`

`fn filter<P>(self, predicate: P) -> Filter<Self, P> where P: FnMut(&Self::Item) -> bool`

`fn filter_map<B, F>(self, f: F) -> FilterMap<Self, F> where F: FnMut(Self::Item) -> Option<B>`

`fn enumerate(self) -> Enumerate<Self>`

`fn peekable(self) -> Peekable<Self>`

`fn skip_while<P>(self, predicate: P) -> SkipWhile<Self, P> where P: FnMut(&Self::Item) -> bool`

`fn take_while<P>(self, predicate: P) -> TakeWhile<Self, P> where P: FnMut(&Self::Item) -> bool`

`fn skip(self, n: usize) -> Skip<Self>`

`fn take(self, n: usize) -> Take<Self>`

`fn scan<St, B, F>(self, initial_state: St, f: F) -> Scan<Self, St, F> where F: FnMut(&mut St, Self::Item) -> Option<B>`

`fn flat_map<U, F>(self, f: F) -> FlatMap<Self, U, F> where F: FnMut(Self::Item) -> U, U: IntoIterator`

`fn fuse(self) -> Fuse<Self>`

`fn inspect<F>(self, f: F) -> Inspect<Self, F> where F: FnMut(&Self::Item) -> ()`

`fn by_ref(&mut self) -> &mut Self`

`fn collect<B>(self) -> B where B: FromIterator<Self::Item>`

`fn partition<B, F>(self, f: F) -> (B, B) where F: FnMut(&Self::Item) -> bool, B: Default + Extend<Self::Item>`

`fn fold<B, F>(self, init: B, f: F) -> B where F: FnMut(B, Self::Item) -> B`

`fn all<F>(&mut self, f: F) -> bool where F: FnMut(Self::Item) -> bool`

`fn any<F>(&mut self, f: F) -> bool where F: FnMut(Self::Item) -> bool`

`fn find<P>(&mut self, predicate: P) -> Option<Self::Item> where P: FnMut(&Self::Item) -> bool`

`fn position<P>(&mut self, predicate: P) -> Option<usize> where P: FnMut(Self::Item) -> bool`

`fn rposition<P>(&mut self, predicate: P) -> Option<usize> where Self: ExactSizeIterator + DoubleEndedIterator, P: FnMut(Self::Item) -> bool`

`fn max(self) -> Option<Self::Item> where Self::Item: Ord`

`fn min(self) -> Option<Self::Item> where Self::Item: Ord`

`fn max_by<B, F>(self, f: F) -> Option<Self::Item> where B: Ord, F: FnMut(&Self::Item) -> B`

`fn max_by_key<B, F>(self, f: F) -> Option<Self::Item> where F: FnMut(&Self::Item) -> B, B: Ord`

`fn min_by<B, F>(self, f: F) -> Option<Self::Item> where F: FnMut(&Self::Item) -> B, B: Ord`

`fn min_by_key<B, F>(self, f: F) -> Option<Self::Item> where F: FnMut(&Self::Item) -> B, B: Ord`

`fn rev(self) -> Rev<Self> where Self: DoubleEndedIterator`

`fn unzip<A, B, FromA, FromB>(self) -> (FromA, FromB) where FromB: Default + Extend<B>, Self: Iterator<Item=(A, B)>, FromA: Default + Extend<A>`

`fn cloned<'a, T>(self) -> Cloned<Self> where Self: Iterator<Item=&'a T>, T: 'a + Clone`

`fn cycle(self) -> Cycle<Self> where Self: Clone`

`fn sum<S>(self) -> S where S: Add<Self::Item, Output=S> + Zero`

`fn product<P>(self) -> P where P: Mul<Self::Item, Output=P> + One`

`fn cmp<I>(self, other: I) -> Ordering where I: IntoIterator<Item=Self::Item>, Self::Item: Ord`

`fn partial_cmp<I>(self, other: I) -> Option<Ordering> where I: IntoIterator, Self::Item: PartialOrd<I::Item>`

`fn eq<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialEq<I::Item>`

`fn ne<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialEq<I::Item>`

`fn lt<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>`

`fn le<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>`

`fn gt<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>`

`fn ge<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>`

Struct utf8_ranges::Utf8Sequences [−] [src]

Example

Methods

impl Utf8Sequences

fn new(start: char, end: char) -> Self[−]

Trait Implementations

impl Iterator for Utf8Sequences

type Item = Utf8Sequence

fn next(&mut self) -> Option<Self::Item>

fn size_hint(&self) -> (usize, Option<usize>)

fn count(self) -> usize

fn last(self) -> Option<Self::Item>

fn nth(&mut self, n: usize) -> Option<Self::Item>

fn chain<U>(self, other: U) -> Chain<Self, U::IntoIter> where U: IntoIterator<Item=Self::Item>

fn zip<U>(self, other: U) -> Zip<Self, U::IntoIter> where U: IntoIterator

fn map<B, F>(self, f: F) -> Map<Self, F> where F: FnMut(Self::Item) -> B

fn filter<P>(self, predicate: P) -> Filter<Self, P> where P: FnMut(&Self::Item) -> bool

fn filter_map<B, F>(self, f: F) -> FilterMap<Self, F> where F: FnMut(Self::Item) -> Option<B>

fn enumerate(self) -> Enumerate<Self>

fn peekable(self) -> Peekable<Self>

fn skip_while<P>(self, predicate: P) -> SkipWhile<Self, P> where P: FnMut(&Self::Item) -> bool

fn take_while<P>(self, predicate: P) -> TakeWhile<Self, P> where P: FnMut(&Self::Item) -> bool

fn skip(self, n: usize) -> Skip<Self>

fn take(self, n: usize) -> Take<Self>

fn scan<St, B, F>(self, initial_state: St, f: F) -> Scan<Self, St, F> where F: FnMut(&mut St, Self::Item) -> Option<B>

fn flat_map<U, F>(self, f: F) -> FlatMap<Self, U, F> where F: FnMut(Self::Item) -> U, U: IntoIterator

fn fuse(self) -> Fuse<Self>

fn inspect<F>(self, f: F) -> Inspect<Self, F> where F: FnMut(&Self::Item) -> ()

fn by_ref(&mut self) -> &mut Self

fn collect<B>(self) -> B where B: FromIterator<Self::Item>

fn partition<B, F>(self, f: F) -> (B, B) where F: FnMut(&Self::Item) -> bool, B: Default + Extend<Self::Item>

fn fold<B, F>(self, init: B, f: F) -> B where F: FnMut(B, Self::Item) -> B

fn all<F>(&mut self, f: F) -> bool where F: FnMut(Self::Item) -> bool

fn any<F>(&mut self, f: F) -> bool where F: FnMut(Self::Item) -> bool

fn find<P>(&mut self, predicate: P) -> Option<Self::Item> where P: FnMut(&Self::Item) -> bool

fn position<P>(&mut self, predicate: P) -> Option<usize> where P: FnMut(Self::Item) -> bool

fn rposition<P>(&mut self, predicate: P) -> Option<usize> where Self: ExactSizeIterator + DoubleEndedIterator, P: FnMut(Self::Item) -> bool

fn max(self) -> Option<Self::Item> where Self::Item: Ord

fn min(self) -> Option<Self::Item> where Self::Item: Ord

fn max_by<B, F>(self, f: F) -> Option<Self::Item> where B: Ord, F: FnMut(&Self::Item) -> B

fn max_by_key<B, F>(self, f: F) -> Option<Self::Item> where F: FnMut(&Self::Item) -> B, B: Ord

fn min_by<B, F>(self, f: F) -> Option<Self::Item> where F: FnMut(&Self::Item) -> B, B: Ord

fn min_by_key<B, F>(self, f: F) -> Option<Self::Item> where F: FnMut(&Self::Item) -> B, B: Ord

fn rev(self) -> Rev<Self> where Self: DoubleEndedIterator

fn unzip<A, B, FromA, FromB>(self) -> (FromA, FromB) where FromB: Default + Extend<B>, Self: Iterator<Item=(A, B)>, FromA: Default + Extend<A>

fn cloned<'a, T>(self) -> Cloned<Self> where Self: Iterator<Item=&'a T>, T: 'a + Clone

fn cycle(self) -> Cycle<Self> where Self: Clone

fn sum<S>(self) -> S where S: Add<Self::Item, Output=S> + Zero

fn product<P>(self) -> P where P: Mul<Self::Item, Output=P> + One

fn cmp<I>(self, other: I) -> Ordering where I: IntoIterator<Item=Self::Item>, Self::Item: Ord

fn partial_cmp<I>(self, other: I) -> Option<Ordering> where I: IntoIterator, Self::Item: PartialOrd<I::Item>

fn eq<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialEq<I::Item>

fn ne<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialEq<I::Item>

fn lt<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>

fn le<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>

fn gt<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>

fn ge<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>

`impl Utf8Sequences`

`fn new(start: char, end: char) -> Self`[−]

`impl Iterator for Utf8Sequences`

`type Item = Utf8Sequence`

`fn next(&mut self) -> Option<Self::Item>`

`fn size_hint(&self) -> (usize, Option<usize>)`

`fn count(self) -> usize`

`fn last(self) -> Option<Self::Item>`

`fn nth(&mut self, n: usize) -> Option<Self::Item>`

`fn chain<U>(self, other: U) -> Chain<Self, U::IntoIter> where U: IntoIterator<Item=Self::Item>`

`fn zip<U>(self, other: U) -> Zip<Self, U::IntoIter> where U: IntoIterator`

`fn map<B, F>(self, f: F) -> Map<Self, F> where F: FnMut(Self::Item) -> B`

`fn filter<P>(self, predicate: P) -> Filter<Self, P> where P: FnMut(&Self::Item) -> bool`

`fn filter_map<B, F>(self, f: F) -> FilterMap<Self, F> where F: FnMut(Self::Item) -> Option<B>`

`fn enumerate(self) -> Enumerate<Self>`

`fn peekable(self) -> Peekable<Self>`

`fn skip_while<P>(self, predicate: P) -> SkipWhile<Self, P> where P: FnMut(&Self::Item) -> bool`

`fn take_while<P>(self, predicate: P) -> TakeWhile<Self, P> where P: FnMut(&Self::Item) -> bool`

`fn skip(self, n: usize) -> Skip<Self>`

`fn take(self, n: usize) -> Take<Self>`

`fn scan<St, B, F>(self, initial_state: St, f: F) -> Scan<Self, St, F> where F: FnMut(&mut St, Self::Item) -> Option<B>`

`fn flat_map<U, F>(self, f: F) -> FlatMap<Self, U, F> where F: FnMut(Self::Item) -> U, U: IntoIterator`

`fn fuse(self) -> Fuse<Self>`

`fn inspect<F>(self, f: F) -> Inspect<Self, F> where F: FnMut(&Self::Item) -> ()`

`fn by_ref(&mut self) -> &mut Self`

`fn collect<B>(self) -> B where B: FromIterator<Self::Item>`

`fn partition<B, F>(self, f: F) -> (B, B) where F: FnMut(&Self::Item) -> bool, B: Default + Extend<Self::Item>`

`fn fold<B, F>(self, init: B, f: F) -> B where F: FnMut(B, Self::Item) -> B`

`fn all<F>(&mut self, f: F) -> bool where F: FnMut(Self::Item) -> bool`

`fn any<F>(&mut self, f: F) -> bool where F: FnMut(Self::Item) -> bool`

`fn find<P>(&mut self, predicate: P) -> Option<Self::Item> where P: FnMut(&Self::Item) -> bool`

`fn position<P>(&mut self, predicate: P) -> Option<usize> where P: FnMut(Self::Item) -> bool`

`fn rposition<P>(&mut self, predicate: P) -> Option<usize> where Self: ExactSizeIterator + DoubleEndedIterator, P: FnMut(Self::Item) -> bool`

`fn max(self) -> Option<Self::Item> where Self::Item: Ord`

`fn min(self) -> Option<Self::Item> where Self::Item: Ord`

`fn max_by<B, F>(self, f: F) -> Option<Self::Item> where B: Ord, F: FnMut(&Self::Item) -> B`

`fn max_by_key<B, F>(self, f: F) -> Option<Self::Item> where F: FnMut(&Self::Item) -> B, B: Ord`

`fn min_by<B, F>(self, f: F) -> Option<Self::Item> where F: FnMut(&Self::Item) -> B, B: Ord`

`fn min_by_key<B, F>(self, f: F) -> Option<Self::Item> where F: FnMut(&Self::Item) -> B, B: Ord`

`fn rev(self) -> Rev<Self> where Self: DoubleEndedIterator`

`fn unzip<A, B, FromA, FromB>(self) -> (FromA, FromB) where FromB: Default + Extend<B>, Self: Iterator<Item=(A, B)>, FromA: Default + Extend<A>`

`fn cloned<'a, T>(self) -> Cloned<Self> where Self: Iterator<Item=&'a T>, T: 'a + Clone`

`fn cycle(self) -> Cycle<Self> where Self: Clone`

`fn sum<S>(self) -> S where S: Add<Self::Item, Output=S> + Zero`

`fn product<P>(self) -> P where P: Mul<Self::Item, Output=P> + One`

`fn cmp<I>(self, other: I) -> Ordering where I: IntoIterator<Item=Self::Item>, Self::Item: Ord`

`fn partial_cmp<I>(self, other: I) -> Option<Ordering> where I: IntoIterator, Self::Item: PartialOrd<I::Item>`

`fn eq<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialEq<I::Item>`

`fn ne<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialEq<I::Item>`

`fn lt<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>`

`fn le<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>`

`fn gt<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>`

`fn ge<I>(self, other: I) -> bool where I: IntoIterator, Self::Item: PartialOrd<I::Item>`