//! Character escapes are a construct that occurs in the [string][] and //! [text][] content types. //! //! They’re formed with the following BNF: //! //! ```bnf //! character_escape ::= '\\' ascii_punctuation //! ``` //! //! Like much of markdown, there are no “invalid” character escapes: just a //! slash, or a slash followed by anything other than an ASCII punctuation //! character, is exactly that: just a slash. //! To escape (most) arbitrary characters, use a //! [character reference][character_reference] instead //! (as in, `&`, `{`, or say ` `). //! It is also possible to escape a line ending in text with a similar //! construct: a [hard break (escape)][hard_break_escape] is a backslash followed //! by a line ending (that is part of the construct instead of ending it). //! //! ## Tokens //! //! * [`CharacterEscape`][Name::CharacterEscape] //! * [`CharacterEscapeMarker`][Name::CharacterEscapeMarker] //! * [`CharacterEscapeValue`][Name::CharacterEscapeValue] //! //! ## References //! //! * [`character-escape.js` in `micromark`](https://github.com/micromark/micromark/blob/main/packages/micromark-core-commonmark/dev/lib/character-escape.js) //! * [*§ 2.4 Backslash escapes* in `CommonMark`](https://spec.commonmark.org/0.30/#backslash-escapes) //! //! [string]: crate::construct::string //! [text]: crate::construct::text //! [character_reference]: crate::construct::character_reference //! [hard_break_escape]: crate::construct::hard_break_escape use crate::event::Name; use crate::state::{Name as StateName, State}; use crate::tokenizer::Tokenizer; /// Start of character escape. /// /// ```markdown /// > | a\*b /// ^ /// ``` pub fn start(tokenizer: &mut Tokenizer) -> State { if tokenizer.parse_state.constructs.character_escape && tokenizer.current == Some(b'\\') { tokenizer.enter(Name::CharacterEscape); tokenizer.enter(Name::CharacterEscapeMarker); tokenizer.consume(); tokenizer.exit(Name::CharacterEscapeMarker); State::Next(StateName::CharacterEscapeInside) } else { State::Nok } } /// After `\`, at punctuation. /// /// ```markdown /// > | a\*b /// ^ /// ``` pub fn inside(tokenizer: &mut Tokenizer) -> State { match tokenizer.current { // ASCII punctuation. Some(b'!'..=b'/' | b':'..=b'@' | b'['..=b'`' | b'{'..=b'~') => { tokenizer.enter(Name::CharacterEscapeValue); tokenizer.consume(); tokenizer.exit(Name::CharacterEscapeValue); tokenizer.exit(Name::CharacterEscape); State::Ok } _ => State::Nok, } }