summary | refs | log | tree | commit | diff
path: root/src/parse
diff options
context:
space:
mode:
author Laurenz <laurmaedje@gmail.com> 2021-07-08 20:03:13 +0200
committer Laurenz <laurmaedje@gmail.com> 2021-07-08 20:03:13 +0200
commit 5c327e249e03ac303e7fef40e2df6c6ef834db66 (patch)
tree 44e60f7ed494e1e6452f378620baa4afbc755346 /src/parse
parent f85e5aac64784deac75950a1307f2ca802ad6765 (diff)
Switch to = for headings once again
Diffstat (limited to 'src/parse')
-rw-r--r-- src/parse/mod.rs 10
-rw-r--r-- src/parse/scanner.rs 6
-rw-r--r-- src/parse/tokens.rs 51
3 files changed, 34 insertions, 33 deletions
diff --git a/src/parse/mod.rs b/src/parse/mod.rs
index bdecc31f..1d893ad9 100644
--- a/src/parse/mod.rs
+++ b/src/parse/mod.rs
@@ -102,14 +102,12 @@ fn node(p: &mut Parser, at_start: &mut bool) -> Option<Node> {
Token::Star => Node::Strong(span),
Token::Underscore => Node::Emph(span),
Token::Raw(t) => raw(p, t),
- Token::Hashtag if *at_start => return Some(heading(p)),
+ Token::Eq if *at_start => return Some(heading(p)),
Token::Hyph if *at_start => return Some(list_item(p)),
Token::Numbering(number) if *at_start => return Some(enum_item(p, number)),
// Line-based markup that is not currently at the start of the line.
- Token::Hashtag | Token::Hyph | Token::Numbering(_) => {
- Node::Text(p.peek_src().into())
- }
+ Token::Eq | Token::Hyph | Token::Numbering(_) => Node::Text(p.peek_src().into()),
// Hashtag + keyword / identifier.
Token::Ident(_)
@@ -183,11 +181,11 @@ fn raw(p: &mut Parser, token: RawToken) -> Node {
/// Parse a heading.
fn heading(p: &mut Parser) -> Node {
let start = p.next_start();
- p.assert(Token::Hashtag);
+ p.assert(Token::Eq);
// Count depth.
let mut level: usize = 1;
- while p.eat_if(Token::Hashtag) {
+ while p.eat_if(Token::Eq) {
level += 1;
}
diff --git a/src/parse/scanner.rs b/src/parse/scanner.rs
index fad44e89..af88aa68 100644
--- a/src/parse/scanner.rs
+++ b/src/parse/scanner.rs
@@ -88,12 +88,12 @@ impl<'s> Scanner<'s> {
/// Checks whether the next char fulfills a condition.
///
- /// Returns `false` if there is no next char.
- pub fn check<F>(&self, f: F) -> bool
+ /// Returns `default` if there is no next char.
+ pub fn check_or<F>(&self, default: bool, f: F) -> bool
where
F: FnOnce(char) -> bool,
{
- self.peek().map(f).unwrap_or(false)
+ self.peek().map_or(default, f)
}
/// The previous index in the source string.
diff --git a/src/parse/tokens.rs b/src/parse/tokens.rs
index f2196740..aebe7b70 100644
--- a/src/parse/tokens.rs
+++ b/src/parse/tokens.rs
@@ -89,19 +89,22 @@ impl<'s> Iterator for Tokens<'s> {
impl<'s> Tokens<'s> {
fn markup(&mut self, start: usize, c: char) -> Token<'s> {
match c {
+ // Escape sequences.
+ '\\' => self.backslash(),
+
+ // Keywords and identifiers.
+ '#' => self.hash(),
+
// Markup.
'~' => Token::Tilde,
'*' => Token::Star,
'_' => Token::Underscore,
- '\\' => self.backslash(),
'`' => self.raw(),
'$' => self.math(),
'-' => self.hyph(start),
+ '=' if self.s.check_or(true, |c| c == '=' || c.is_whitespace()) => Token::Eq,
c if c == '.' || c.is_ascii_digit() => self.numbering(start, c),
- // Headings, keywords and identifiers.
- '#' => self.hash(start),
-
// Plain text.
_ => self.text(start),
}
@@ -143,7 +146,7 @@ impl<'s> Tokens<'s> {
// Numbers.
c if c.is_ascii_digit()
- || (c == '.' && self.s.check(|n| n.is_ascii_digit())) =>
+ || (c == '.' && self.s.check_or(false, |n| n.is_ascii_digit())) =>
{
self.number(start, c)
}
@@ -157,7 +160,7 @@ impl<'s> Tokens<'s> {
fn whitespace(&mut self, first: char) -> Token<'s> {
// Fast path for just a single space
- if first == ' ' && !self.s.check(char::is_whitespace) {
+ if first == ' ' && self.s.check_or(true, |c| !c.is_whitespace()) {
Token::Space(0)
} else {
self.s.uneat();
@@ -188,8 +191,10 @@ impl<'s> Tokens<'s> {
'/' => true,
// Parentheses.
'[' | ']' | '{' | '}' => true,
+ // Code.
+ '#' => true,
// Markup.
- '#' | '~' | '*' | '_' | '`' | '$' | '-' => true,
+ '~' | '*' | '_' | '`' | '$' | '-' => true,
// Escaping.
'\\' => true,
// Just text.
@@ -233,18 +238,16 @@ impl<'s> Tokens<'s> {
}
}
- fn hash(&mut self, start: usize) -> Token<'s> {
- if self.s.check(is_id_start) {
+ fn hash(&mut self) -> Token<'s> {
+ if self.s.check_or(false, is_id_start) {
let read = self.s.eat_while(is_id_continue);
if let Some(keyword) = keyword(read) {
keyword
} else {
Token::Ident(read)
}
- } else if self.s.check(|c| c != '#' && !c.is_whitespace()) {
- Token::Text(self.s.eaten_from(start))
} else {
- Token::Hashtag
+ Token::Invalid("#")
}
}
@@ -255,10 +258,10 @@ impl<'s> Tokens<'s> {
} else {
Token::HyphHyph
}
- } else if self.s.check(|c| !c.is_whitespace()) {
- Token::Text(self.s.eaten_from(start))
- } else {
+ } else if self.s.check_or(true, char::is_whitespace) {
Token::Hyph
+ } else {
+ Token::Text(self.s.eaten_from(start))
}
}
@@ -274,11 +277,11 @@ impl<'s> Tokens<'s> {
None
};
- if self.s.check(|c| !c.is_whitespace()) {
- return Token::Text(self.s.eaten_from(start));
+ if self.s.check_or(true, char::is_whitespace) {
+ Token::Numbering(number)
+ } else {
+ Token::Text(self.s.eaten_from(start))
}
-
- Token::Numbering(number)
}
fn raw(&mut self) -> Token<'s> {
@@ -663,8 +666,8 @@ mod tests {
// Test code symbols in text.
t!(Markup[" /"]: "a():\"b" => Text("a():\"b"));
t!(Markup[" /"]: ";:,|/+" => Text(";:,|"), Text("/+"));
- t!(Markup[" /"]: "#-a" => Text("#"), Text("-"), Text("a"));
- t!(Markup[" "]: "#123" => Text("#"), Text("123"));
+ t!(Markup[" /"]: "=-a" => Text("="), Text("-"), Text("a"));
+ t!(Markup[" "]: "#123" => Invalid("#"), Text("123"));
// Test text ends.
t!(Markup[""]: "hello " => Text("hello"), Space(0));
@@ -712,8 +715,8 @@ mod tests {
// Test markup tokens.
t!(Markup[" a1"]: "*" => Star);
t!(Markup: "_" => Underscore);
- t!(Markup[""]: "###" => Hashtag, Hashtag, Hashtag);
- t!(Markup["a1/"]: "# " => Hashtag, Space(0));
+ t!(Markup[""]: "===" => Eq, Eq, Eq);
+ t!(Markup["a1/"]: "= " => Eq, Space(0));
t!(Markup: "~" => Tilde);
t!(Markup[" "]: r"\" => Backslash);
t!(Markup["a "]: r"a--" => Text("a"), HyphHyph);
@@ -776,7 +779,7 @@ mod tests {
for &(s, t) in &list {
t!(Markup[" "]: format!("#{}", s) => t);
t!(Markup[" "]: format!("#{0}#{0}", s) => t, t);
- t!(Markup[" /"]: format!("# {}", s) => Token::Hashtag, Space(0), Text(s));
+ t!(Markup[" /"]: format!("# {}", s) => Token::Invalid("#"), Space(0), Text(s));
}
for &(s, t) in &list {