1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
|
//! Low-level char-based scanner.
use std::fmt::{self, Debug, Formatter};
use std::slice::SliceIndex;
use std::str::Chars;
/// A low-level, feature-rich scanner that walks a string char by char.
///
/// The scanner keeps the full source around, so already consumed text can be
/// sliced out again at any time.
pub struct Scanner<'s> {
    /// The complete source string.
    src: &'s str,
    /// Iterator over the chars that have not been consumed yet.
    iter: Chars<'s>,
    /// Byte offset into `src` of the next char to be consumed.
    index: usize,
}

impl<'s> Scanner<'s> {
    /// Create a scanner positioned at the very start of `src`.
    pub fn new(src: &'s str) -> Self {
        Self { src, iter: src.chars(), index: 0 }
    }

    /// Consume the next char and return it.
    ///
    /// Returns `None` (and consumes nothing) at the end of the source.
    pub fn eat(&mut self) -> Option<char> {
        let c = self.iter.next()?;
        self.index += c.len_utf8();
        Some(c)
    }

    /// Consume the next char only if it equals `c`.
    ///
    /// Returns `true` when the char was consumed and `false` otherwise.
    pub fn eat_if(&mut self, c: char) -> bool {
        // Advance the iterator directly instead of going through `peek()`
        // followed by `eat()`, so the char is decoded only once.
        //
        // TODO: Benchmark this vs. the naive version.
        let matched = self.iter.next() == Some(c);
        if matched {
            self.index += c.len_utf8();
        } else {
            // The iterator ran one char ahead of `index`; rewind it.
            self.reset();
        }
        matched
    }

    /// Consume the next char and debug-assert that it equals `c`.
    pub fn eat_assert(&mut self, c: char) {
        // Eat outside of the assertion macro: its arguments are not
        // evaluated when debug assertions are disabled, but the char must be
        // consumed either way.
        let eaten = self.eat();
        debug_assert_eq!(eaten, Some(c));
    }

    /// Consume the next char, reporting a `\r\n` pair as a single `\n`.
    ///
    /// A `\r` that is not followed by `\n` is returned unchanged.
    pub fn eat_merging_crlf(&mut self) -> Option<char> {
        match self.eat() {
            Some('\r') if self.eat_if('\n') => Some('\n'),
            other => other,
        }
    }

    /// Consume chars for as long as `f` returns `true` for them.
    ///
    /// Returns the consumed part of the source.
    pub fn eat_while(&mut self, mut f: impl FnMut(char) -> bool) -> &'s str {
        let stop = |c: char| !f(c);
        self.eat_until(stop)
    }

    /// Consume chars up to, but not including, the first one for which `f`
    /// returns `true`.
    ///
    /// Returns the consumed part of the source. If `f` never returns `true`,
    /// everything up to the end of the source is consumed.
    pub fn eat_until(&mut self, mut f: impl FnMut(char) -> bool) -> &'s str {
        let start = self.index;
        loop {
            match self.iter.next() {
                Some(c) if !f(c) => self.index += c.len_utf8(),
                Some(_) => {
                    // The stop char has already been pulled out of the
                    // iterator. Rewind to `index` once here rather than
                    // peeking before every single char.
                    //
                    // TODO: Benchmark this vs. the naive peeking version.
                    self.reset();
                    break;
                }
                None => break,
            }
        }
        self.eaten_from(start)
    }

    /// Step back over the most recently consumed char.
    ///
    /// Does nothing when the scanner is at the start of the source.
    pub fn uneat(&mut self) {
        let previous = self.prev_index();
        self.index = previous;
        self.reset();
    }

    /// Look at the next char without consuming it.
    pub fn peek(&self) -> Option<char> {
        let mut lookahead = self.iter.clone();
        lookahead.next()
    }

    /// Look at the char `n` positions ahead without consuming anything.
    ///
    /// `peek_nth(0)` is the same char that `peek()` returns.
    pub fn peek_nth(&self, n: usize) -> Option<char> {
        let mut lookahead = self.iter.clone();
        lookahead.nth(n)
    }

    /// Check whether the next char fulfills the condition `f`.
    ///
    /// Returns `false` if there is no next char.
    pub fn check(&self, f: impl FnMut(char) -> bool) -> bool {
        self.peek().map_or(false, f)
    }

    /// Re-create the char iterator so that it starts at `index` again.
    fn reset(&mut self) {
        self.iter = self.rest().chars();
    }
}

impl<'s> Scanner<'s> {
    /// The current byte index in the source string.
    pub fn index(&self) -> usize {
        self.index
    }

    /// The byte index at which the most recently consumed char starts.
    ///
    /// Returns `0` if nothing has been consumed yet.
    pub fn prev_index(&self) -> usize {
        match self.eaten().chars().next_back() {
            Some(last) => self.index - last.len_utf8(),
            None => 0,
        }
    }

    /// Slice a part out of the source string.
    ///
    /// # Panics
    /// Panics like regular string indexing does, that is if `index` is out
    /// of bounds or does not lie on char boundaries.
    pub fn get<I>(&self, index: I) -> &'s str
    where
        I: SliceIndex<str, Output = str>,
    {
        &self.src[index]
    }

    /// The full source string.
    pub fn src(&self) -> &'s str {
        self.src
    }

    /// The part of the source string before the current index.
    pub fn eaten(&self) -> &'s str {
        self.eaten_from(0)
    }

    /// The part of the source string from `start` up to the current index.
    ///
    /// # Panics
    /// Panics if `start` is greater than the current index or does not lie
    /// on a char boundary.
    pub fn eaten_from(&self, start: usize) -> &'s str {
        self.get(start..self.index)
    }

    /// The part of the source string from the current index onwards.
    pub fn rest(&self) -> &'s str {
        self.get(self.index..)
    }
}
impl Debug for Scanner<'_> {
    /// Formats the scanner as `Scanner(<eaten>|<rest>)`, where the `|` marks
    /// the current position within the source string.
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        // Split the source at the current index into the consumed and the
        // remaining part.
        let (before, after) = self.src.split_at(self.index);
        write!(f, "Scanner({}|{})", before, after)
    }
}
|