prevent creation of tokens for each text that seems like markup

This commit is contained in:
Guilhem Fauré 2023-04-27 16:25:23 +02:00
parent d30e8d07ee
commit 9a5735c046

View File

@ -52,20 +52,18 @@ closing_tag: _O_ANGLE _SLASH TEXT ( _PIPE TEXT )? _C_ANGLE -> closing_tag
opening_tag: _O_ANGLE TEXT ( _PIPE TEXT )? _C_ANGLE -> opening_tag opening_tag: _O_ANGLE TEXT ( _PIPE TEXT )? _C_ANGLE -> opening_tag
// Terminals // Terminals
/// Windows or Unix line breaks
_N: /\r?\n/ _N: /\r?\n/
SEPARATOR: "----" "-"*
TEXT: ( PURE_TEXT | AMBIGUOUS_TEXT )+
/// Blocks
_HYPHEN_STAR: "-*" _HYPHEN_STAR: "-*"
_HYPHEN_HASH: "-#" _HYPHEN_HASH: "-#"
_PIPE: "|" _PIPE: "|"
_SLASH: "/" _SLASH: "/"
_O_ANGLE: "<" _O_ANGLE: "<"
_C_ANGLE: ">" _C_ANGLE: ">"
/// Opening angle bracket followed by text and not followed by a closing tag
_ORPHAN_OPENING: /<(?=([^>\/]+?)>)(?!.*<\/\1>)/ _ORPHAN_OPENING: /<(?=([^>\/]+?)>)(?!.*<\/\1>)/
/// Markup
_O_CURLY_3: "{{{" _O_CURLY_3: "{{{"
_C_CURLY_3: "}}}" _C_CURLY_3: "}}}"
_O_CURLY_2: "{{" _O_CURLY_2: "{{"
@ -73,39 +71,17 @@ _C_CURLY_2: "}}"
_O_CURLY: "{" _O_CURLY: "{"
_C_CURLY: "}" _C_CURLY: "}"
/// Links
_O_SQUARE_2: "[[" _O_SQUARE_2: "[["
_C_SQUARE_2: "]]" _C_SQUARE_2: "]]"
_O_SQUARE_INTERO: "[?" _O_SQUARE_INTERO: "[?"
_C_SQUARE: "]" _C_SQUARE: "]"
_ARROW: "->" _ARROW: "->"
/// Opening square bracket followed by text and an hyphen angle bracket arrow _LINK_OPENING: /\[(?=/ PURE_TEXT+ /]*->)/
_LINK_OPENING: /\[(?=[^\r\n\[\]]*->)/ HREF: PURE_TEXT+
LINK_TEXT: PURE_TEXT /+(?=->)/
/// Content /// Every characters that have no markup meaning
SEPARATOR: "----" "-"* PURE_TEXT: /[^\r\n\|\{\}\[\]\<\>]/
/// Characters that could be markup but arent in this situation
/// Text AMBIGUOUS_TEXT: /\[(?!.*->.*\])/
// - Dont contains line breaks
// - Dont contains any markup element…
// - EXCEPTED when they are used as in regular text
TEXT: /[^\r\n\|\{\}\[\]\<\>]+/
| /\[(?!.*->.*\])/
| /\]/ | /\]/
/// Inner text :
// - Dont contains line breaks
// - Dont contains markup closing right curly braces
// INNER_TEXT: /[^\r\n\}]+/
/// Link href :
// - Dont contains line breaks
// - Dont contains markup closing right square brackets
// HREF: /[^\r\n\]]+/
HREF: TEXT
/// Link text :
// - Dont contains line breaks
// - Dont contains an opening or closing square bracket
// - Dont contains an hyphen angle bracket arrow ( -> )
LINK_TEXT: /[^\r\n\[\]]+(?=->)/