mdz_helpers.ts

Shared constants and pure helper functions for mdz parsers.
Used by both the single-pass parser (mdz.ts) and the two-phase
lexer+parser (mdz_lexer.ts + mdz_token_parser.ts).

Declarations
#

48 declarations

view source

A_LOWER
#

mdz_helpers.ts view source

97

A_UPPER
#

mdz_helpers.ts view source

65

AMPERSAND
#

mdz_helpers.ts view source

38

APOSTROPHE
#

mdz_helpers.ts view source

39

ASTERISK
#

mdz_helpers.ts view source

42

AT
#

mdz_helpers.ts view source

64

BACKTICK
#

mdz_helpers.ts view source

96

COLON
#

mdz_helpers.ts view source

58

COMMA
#

mdz_helpers.ts view source

44

DOLLAR
#

mdz_helpers.ts view source

36

EQUALS
#

mdz_helpers.ts view source

61

EXCLAMATION
#

mdz_helpers.ts view source

33

extract_single_tag
#

mdz_helpers.ts view source

(nodes: MdzNode[]): MdzElementNode | MdzComponentNode | null

`nodes`

type MdzNode[]

returns

MdzElementNode | MdzComponentNode | null

HASH
#

mdz_helpers.ts view source

35

HR_HYPHEN_COUNT
#

mdz_helpers.ts view source

3

HTTP_PREFIX_LENGTH
#

mdz_helpers.ts view source

7

HTTPS_PREFIX_LENGTH
#

mdz_helpers.ts view source

8

HYPHEN
#

mdz_helpers.ts view source

45

is_at_absolute_path
#

mdz_helpers.ts view source

(text: string, index: number): boolean

Check if position in text is the start of an absolute path (starts with /).
Must be preceded by whitespace or be at the start of the string.
Rejects `//` (comments/protocol-relative) and `/ ` (bare slash).

`text`

type string

`index`

type number

returns

boolean

is_at_relative_path
#

mdz_helpers.ts view source

(text: string, index: number): boolean

Check if position in text is the start of a relative path (./ or ../).
Must be preceded by whitespace or be at the start of the string.
Requires at least one path character after the prefix.

`text`

type string

`index`

type number

returns

boolean

is_letter
#

mdz_helpers.ts view source

(char_code: number): boolean

Check if character code is a letter (A-Z, a-z).

`char_code`

type number

returns

boolean

is_tag_name_char
#

mdz_helpers.ts view source

(char_code: number): boolean

Check if character code is valid in a tag name (letter, digit, hyphen, or underscore).

`char_code`

type number

returns

boolean

is_valid_path_char
#

mdz_helpers.ts view source

(char_code: number): boolean

Check if character code is valid in a URI path per RFC 3986.
Validates against the pchar production plus path/query/fragment separators.
Valid characters:
- unreserved: A-Z a-z 0-9 - . _ ~
- sub-delims: ! $ & ' ( ) * + , ; =
- path allowed: : @
- separators: / ? #
- percent-encoding: %

`char_code`

type number

returns

boolean

is_word_char
#

mdz_helpers.ts view source

(char_code: number): boolean

Check if character code is part of a word for word boundary detection.
Used to prevent intraword emphasis with _ and ~ delimiters.
Formatting delimiters (*, _, ~) are NOT word characters - they're transparent.
Only alphanumeric characters (A-Z, a-z, 0-9) are considered word characters.
This prevents false positives with snake_case identifiers while allowing
adjacent formatting like **bold**_italic_.

`char_code`

type number

returns

boolean

LEFT_ANGLE
#

mdz_helpers.ts view source

60

LEFT_BRACKET
#

mdz_helpers.ts view source

91

LEFT_PAREN
#

mdz_helpers.ts view source

40

MAX_HEADING_LEVEL
#

mdz_helpers.ts view source

6

MIN_CODEBLOCK_BACKTICKS
#

mdz_helpers.ts view source

3

NEWLINE
#

mdz_helpers.ts view source

10

NINE
#

mdz_helpers.ts view source

57

PERCENT
#

mdz_helpers.ts view source

37

PERIOD
#

mdz_helpers.ts view source

46

PLUS
#

mdz_helpers.ts view source

43

QUESTION
#

mdz_helpers.ts view source

63

RIGHT_ANGLE
#

mdz_helpers.ts view source

62

RIGHT_BRACKET
#

mdz_helpers.ts view source

93

RIGHT_PAREN
#

mdz_helpers.ts view source

41

SEMICOLON
#

mdz_helpers.ts view source

59

SLASH
#

mdz_helpers.ts view source

47

SPACE
#

mdz_helpers.ts view source

32

TAB
#

mdz_helpers.ts view source

9

TILDE
#

mdz_helpers.ts view source

126

trim_trailing_punctuation
#

mdz_helpers.ts view source

(url: string): string

Trim trailing punctuation from URL/path per RFC 3986 and GFM rules.
- Trims simple trailing punctuation: .,;:!?]
- Applies balanced-parenthesis logic to () only (parentheses are valid in path components)
- Invalid chars like [] {} are already stopped by the whitelist, but ] is still trimmed as a fallback
Optimized to avoid O(n²) string slicing: tracks an end index and slices once at the end.

`url`

type string

returns

string

UNDERSCORE
#

mdz_helpers.ts view source

95

Z_LOWER
#

mdz_helpers.ts view source

122

Z_UPPER
#

mdz_helpers.ts view source

90

ZERO
#

mdz_helpers.ts view source

48