xref: /dokuwiki/_test/tests/Parsing/Markdown/gfm-spec/skip.php (revision eb15e634e1400f6c4d78f5fb40179ca25f41574d)
172b2703bSAndreas Gohr<?php
272b2703bSAndreas Gohr
372b2703bSAndreas Gohr/**
472b2703bSAndreas Gohr * GFM spec examples that GfmSpecTest should skip, keyed by example number
572b2703bSAndreas Gohr * (as numbered in spec.txt / the rendered spec).
672b2703bSAndreas Gohr *
772b2703bSAndreas Gohr * Add entries here ONLY for behavior DokuWiki has explicitly decided not to
872b2703bSAndreas Gohr * implement — not for features that are merely pending. Unimplemented
972b2703bSAndreas Gohr * features should show as real failures so they remain visible TODOs on
1072b2703bSAndreas Gohr * the branch.
1172b2703bSAndreas Gohr *
1272b2703bSAndreas Gohr * Each value is a short human-readable reason that will appear in phpunit's
1372b2703bSAndreas Gohr * skip output.
1472b2703bSAndreas Gohr */
1572b2703bSAndreas Gohr
1672b2703bSAndreas Gohrreturn [
1772b2703bSAndreas Gohr    // --------------------------------------------------------------------
183e6baeffSAndreas Gohr    // Thematic breaks (GfmHr) — strict-only HR is intentional. The
193e6baeffSAndreas Gohr    // delimiter run must be bare: no leading, trailing, or internal
203e6baeffSAndreas Gohr    // whitespace in either DW or GFM flavor. The list-precedence cases
213e6baeffSAndreas Gohr    // additionally need a GfmListblock guard that is out of scope.
223e6baeffSAndreas Gohr    // --------------------------------------------------------------------
233e6baeffSAndreas Gohr    17 => 'thematic break: 0-3 spaces of leading indent. Strict policy:'
243e6baeffSAndreas Gohr        . ' opener must be at column 0 in either flavor.',
253e6baeffSAndreas Gohr    21 => 'thematic break: spaces between delimiter chars (`- - -`).'
263e6baeffSAndreas Gohr        . ' Strict policy: bare run only.',
273e6baeffSAndreas Gohr    22 => 'thematic break: spaces between delimiter chars (`** * **`).'
283e6baeffSAndreas Gohr        . ' Strict policy: bare run only.',
293e6baeffSAndreas Gohr    23 => 'thematic break: spaces between delimiter chars (`-     -`).'
303e6baeffSAndreas Gohr        . ' Strict policy: bare run only.',
313e6baeffSAndreas Gohr    24 => 'thematic break: trailing spaces after the run. Strict policy:'
323e6baeffSAndreas Gohr        . ' bare run only.',
333e6baeffSAndreas Gohr    29 => 'thematic break: Setext heading underline `Foo\n---` should'
343e6baeffSAndreas Gohr        . ' render as `<h2>`. Setext headings are deliberately not'
353e6baeffSAndreas Gohr        . ' supported — `---` collides with DokuWiki HR and `===` would'
363e6baeffSAndreas Gohr        . ' collide with DokuWiki heading syntax.',
373e6baeffSAndreas Gohr    30 => 'thematic break vs. list-item precedence (`* * *` between list'
383e6baeffSAndreas Gohr        . ' items): requires internal-space HR support and a GfmListblock'
393e6baeffSAndreas Gohr        . ' guard so the list refuses to absorb the HR-shaped line. Both'
403e6baeffSAndreas Gohr        . ' out of scope; the line stays a list-item body.',
413e6baeffSAndreas Gohr    31 => 'thematic break inside list with different bullet (`- * * *`):'
423e6baeffSAndreas Gohr        . ' depends on internal-space HR support inside the sub-parsed'
433e6baeffSAndreas Gohr        . ' item body. See example 30.',
443e6baeffSAndreas Gohr
453e6baeffSAndreas Gohr    // --------------------------------------------------------------------
46b414dba2SAndreas Gohr    // Setext headings (§4.3) — deliberately not supported across the
47b414dba2SAndreas Gohr    // whole section. The `---` underline collides with DokuWiki's HR
48b414dba2SAndreas Gohr    // syntax and `===` would collide with DokuWiki's heading delimiter.
49b414dba2SAndreas Gohr    // Same rationale as #29 (thematic break vs. Setext underline),
50b414dba2SAndreas Gohr    // #111 (fence after Setext), and #212 (Setext after blockquote).
51b414dba2SAndreas Gohr    //
52b414dba2SAndreas Gohr    // Examples #62, #64, #67, #68, #69, #71, #74 are NOT listed: those
53b414dba2SAndreas Gohr    // are cases where Setext is deliberately NOT triggered (blockquote /
54b414dba2SAndreas Gohr    // list / paragraph wins, or blank lines disambiguate), so the spec
55b414dba2SAndreas Gohr    // output matches DokuWiki's no-Setext rendering and they pass
56b414dba2SAndreas Gohr    // naturally.
57b414dba2SAndreas Gohr    //
58b414dba2SAndreas Gohr    // #58 and #75 also depend on DokuWiki's strict-bare-run HR rule
59b414dba2SAndreas Gohr    // (`--- -` and `* * *` need internal-space HR, see #21-23) — they
60b414dba2SAndreas Gohr    // sit in the Setext section because the spec uses them to
61b414dba2SAndreas Gohr    // illustrate Setext-underline edge cases.
62b414dba2SAndreas Gohr    // --------------------------------------------------------------------
63b414dba2SAndreas Gohr    50 => 'Setext heading (`Foo *bar*\n=====` / `\n-----`): Setext'
64b414dba2SAndreas Gohr        . ' headings deliberately not supported — `---`/`===` underlines'
65b414dba2SAndreas Gohr        . ' collide with DokuWiki HR / heading syntax.',
66b414dba2SAndreas Gohr    51 => 'Setext heading with multi-line content: Setext headings'
67b414dba2SAndreas Gohr        . ' deliberately not supported (see #50).',
68b414dba2SAndreas Gohr    52 => 'Setext heading with indented multi-line content: Setext'
69b414dba2SAndreas Gohr        . ' headings deliberately not supported (see #50).',
70b414dba2SAndreas Gohr    53 => 'Setext heading with any-length underline: Setext headings'
71b414dba2SAndreas Gohr        . ' deliberately not supported (see #50).',
72b414dba2SAndreas Gohr    54 => 'Setext heading with 3-space-indented content / underline:'
73b414dba2SAndreas Gohr        . ' Setext headings deliberately not supported (see #50).',
74b414dba2SAndreas Gohr    55 => 'Setext heading: 4-space-indented content forms code block,'
75b414dba2SAndreas Gohr        . ' then `---` HR. Setext headings deliberately not supported'
76b414dba2SAndreas Gohr        . ' (see #50).',
77b414dba2SAndreas Gohr    56 => 'Setext heading: underline indented up to 3 spaces with'
78b414dba2SAndreas Gohr        . ' trailing spaces. Setext headings deliberately not'
79b414dba2SAndreas Gohr        . ' supported (see #50).',
80b414dba2SAndreas Gohr    57 => 'Setext heading vs. 4-space-indented underline (paragraph'
81b414dba2SAndreas Gohr        . ' wins). Setext headings deliberately not supported (see #50).',
82b414dba2SAndreas Gohr    58 => 'Setext heading: underline cannot contain internal spaces'
83b414dba2SAndreas Gohr        . ' (`= =` / `--- -`). Setext headings deliberately not supported'
84b414dba2SAndreas Gohr        . ' (see #50); also depends on internal-space HR support DokuWiki'
85b414dba2SAndreas Gohr        . ' lacks (see #21-23).',
86b414dba2SAndreas Gohr    59 => 'Setext heading: trailing spaces in content do not cause a'
87b414dba2SAndreas Gohr        . ' line break. Setext headings deliberately not supported (see'
88b414dba2SAndreas Gohr        . ' #50).',
89b414dba2SAndreas Gohr    60 => 'Setext heading: trailing backslash in content. Setext'
90b414dba2SAndreas Gohr        . ' headings deliberately not supported (see #50).',
91b414dba2SAndreas Gohr    61 => 'Setext heading: block-structure precedence over inline.'
92b414dba2SAndreas Gohr        . ' Setext headings deliberately not supported (see #50).',
93b414dba2SAndreas Gohr    63 => 'Setext heading: underline cannot be a lazy continuation in'
94b414dba2SAndreas Gohr        . ' a blockquote. Setext headings deliberately not supported'
95b414dba2SAndreas Gohr        . ' (see #50).',
96b414dba2SAndreas Gohr    65 => 'Setext heading: preceding paragraph becomes part of heading'
97b414dba2SAndreas Gohr        . ' content. Setext headings deliberately not supported (see #50).',
98b414dba2SAndreas Gohr    66 => 'Setext heading: no blank line required before/after. Setext'
99b414dba2SAndreas Gohr        . ' headings deliberately not supported (see #50).',
100b414dba2SAndreas Gohr    70 => 'Setext heading: 4-space-indented content forms code block,'
101b414dba2SAndreas Gohr        . ' then `---` HR. Setext headings deliberately not supported'
102b414dba2SAndreas Gohr        . ' (see #50).',
103b414dba2SAndreas Gohr    72 => 'Setext heading with backslash-escaped marker `\\> foo`.'
104b414dba2SAndreas Gohr        . ' Setext headings deliberately not supported (see #50).',
105b414dba2SAndreas Gohr    73 => 'Setext heading: blank-line-separated paragraph + heading +'
106b414dba2SAndreas Gohr        . ' paragraph. Setext headings deliberately not supported (see'
107b414dba2SAndreas Gohr        . ' #50).',
108b414dba2SAndreas Gohr    75 => 'Setext heading boundary: `* * *` should be HR (cannot count'
109b414dba2SAndreas Gohr        . ' as Setext underline). Setext headings deliberately not'
110b414dba2SAndreas Gohr        . ' supported (see #50); also depends on internal-space HR'
111b414dba2SAndreas Gohr        . ' support DokuWiki lacks (see #21-23).',
112b414dba2SAndreas Gohr    76 => 'Setext heading: backslash-escaped underline `\\---` keeps'
113b414dba2SAndreas Gohr        . ' content as paragraph. Setext headings deliberately not'
114b414dba2SAndreas Gohr        . ' supported (see #50).',
115b414dba2SAndreas Gohr
116b414dba2SAndreas Gohr    // --------------------------------------------------------------------
117b1c59bedSAndreas Gohr    // Fenced code blocks (GfmCode / GfmFile) — deliberate simplifications
118b1c59bedSAndreas Gohr    // versus strict GFM. All of these are consequences of lexer constraints
119b1c59bedSAndreas Gohr    // (no regex backreferences) or the deliberate column-0-only policy.
120b1c59bedSAndreas Gohr    // --------------------------------------------------------------------
121b1c59bedSAndreas Gohr    94  => 'fenced code: closing fence must be ≥ opening length — DokuWiki'
122b1c59bedSAndreas Gohr         . ' accepts any 3+ run as a closer (no regex backreferences for'
123b1c59bedSAndreas Gohr         . ' length pairing). Deliberate relaxation.',
124b1c59bedSAndreas Gohr    95  => 'fenced code (tilde variant): closing fence must be ≥ opening'
125b1c59bedSAndreas Gohr         . ' length — see example 94.',
126b1c59bedSAndreas Gohr    96  => 'fenced code: unclosed fence — DokuWiki convention requires a'
127b1c59bedSAndreas Gohr         . ' closer (matches DW <code> tag), so unclosed fences stay'
128b414dba2SAndreas Gohr         . ' literal rather than consuming to EOF. GFM\'s "close at end"'
129b414dba2SAndreas Gohr         . ' rule is really "close at any container boundary" in'
130b414dba2SAndreas Gohr         . ' CommonMark\'s two-pass block parser, which our single-pass'
131b414dba2SAndreas Gohr         . ' lexer cannot implement.',
132b1c59bedSAndreas Gohr    97  => 'fenced code: unclosed fence with intervening short run — stays'
133b1c59bedSAndreas Gohr         . ' literal, see example 96.',
134b414dba2SAndreas Gohr    98  => 'fenced code inside blockquote: GFM closes the fence at the'
135b414dba2SAndreas Gohr         . ' blockquote\'s end, but DokuWiki requires an explicit closing'
136b414dba2SAndreas Gohr         . ' fence and the single-pass lexer has no notion of container'
137b414dba2SAndreas Gohr         . ' boundaries to close at. Same root cause as example 96 —'
138b414dba2SAndreas Gohr         . ' unclosed fences stay literal.',
139b1c59bedSAndreas Gohr    101 => 'fenced code: opener indented 1 space — DokuWiki requires'
140b1c59bedSAndreas Gohr         . ' column-0 fences. Indent tolerance + per-line body dedent out'
141b1c59bedSAndreas Gohr         . ' of scope.',
142b1c59bedSAndreas Gohr    102 => 'fenced code: opener indented 2 spaces — see example 101.',
143b1c59bedSAndreas Gohr    103 => 'fenced code: opener indented 3 spaces — see example 101.',
144b1c59bedSAndreas Gohr    105 => 'fenced code: closer indented 2 spaces — column-0-only policy,'
145b1c59bedSAndreas Gohr         . ' see example 101.',
146b1c59bedSAndreas Gohr    106 => 'fenced code: indented opener with less-indented closer —'
147b1c59bedSAndreas Gohr         . ' column-0-only policy, see example 101.',
148b1c59bedSAndreas Gohr    107 => 'fenced code: 4-space-indented closer — with column-0-only'
149b1c59bedSAndreas Gohr         . ' policy there is no valid closer, so the fence stays literal'
150b1c59bedSAndreas Gohr         . ' (see example 96).',
151b1c59bedSAndreas Gohr    109 => 'fenced code: malformed closer `~~~ ~~` (space-broken run) —'
152b1c59bedSAndreas Gohr         . ' with no valid closer the fence stays literal (see example 96).',
153b1c59bedSAndreas Gohr    108 => 'fenced code: `` `` is not a valid fence; GFM falls back to an'
154b1c59bedSAndreas Gohr         . ' inline code span of length 3. Inline spans with n≥3 not'
155b1c59bedSAndreas Gohr         . ' implemented (GfmBacktickSingle/Double cover only n=1, n=2).',
156b1c59bedSAndreas Gohr    111 => 'fenced code interrupting Setext heading (`foo\n---`): Setext'
157685560ebSAndreas Gohr         . ' headings are deliberately not supported — the `---` underline'
158685560ebSAndreas Gohr         . ' collides with DokuWiki\'s horizontal rule and `===` would'
159685560ebSAndreas Gohr         . ' collide with DokuWiki heading syntax.',
160b1c59bedSAndreas Gohr    115 => 'fenced code: `` `` backtick-fence-with-backticks-in-info-string'
161b1c59bedSAndreas Gohr         . ' is invalid; GFM falls back to n=3 inline span — inline spans'
162b1c59bedSAndreas Gohr         . ' with n≥3 not implemented. See example 108.',
163b1c59bedSAndreas Gohr
164b1c59bedSAndreas Gohr    // --------------------------------------------------------------------
165b414dba2SAndreas Gohr    // HTML blocks (§4.6) — raw HTML pass-through is not supported
166b414dba2SAndreas Gohr    // --------------------------------------------------------------------
167b414dba2SAndreas Gohr    118 => 'raw HTML block (script/pre/style/textarea group): raw HTML pass-through not supported — DokuWiki escapes `<` as `&lt;`',
168b414dba2SAndreas Gohr    119 => 'raw HTML block: raw HTML pass-through not supported',
169b414dba2SAndreas Gohr    120 => 'raw HTML block: raw HTML pass-through not supported',
170b414dba2SAndreas Gohr    121 => 'raw HTML block: raw HTML pass-through not supported',
171b414dba2SAndreas Gohr    122 => 'raw HTML block (comment): raw HTML pass-through not supported',
172b414dba2SAndreas Gohr    123 => 'raw HTML block (processing instruction): raw HTML pass-through not supported',
173b414dba2SAndreas Gohr    124 => 'raw HTML block (declaration): raw HTML pass-through not supported',
174b414dba2SAndreas Gohr    125 => 'raw HTML block (CDATA): raw HTML pass-through not supported',
175b414dba2SAndreas Gohr    126 => 'raw HTML block (block-level tag group): raw HTML pass-through not supported',
176b414dba2SAndreas Gohr    127 => 'raw HTML block: raw HTML pass-through not supported',
177b414dba2SAndreas Gohr    128 => 'raw HTML block: raw HTML pass-through not supported',
178b414dba2SAndreas Gohr    129 => 'raw HTML block: raw HTML pass-through not supported',
179b414dba2SAndreas Gohr    130 => 'raw HTML block: raw HTML pass-through not supported',
180b414dba2SAndreas Gohr    131 => 'raw HTML block: raw HTML pass-through not supported',
181b414dba2SAndreas Gohr    132 => 'raw HTML block: raw HTML pass-through not supported',
182b414dba2SAndreas Gohr    133 => 'raw HTML block: raw HTML pass-through not supported',
183b414dba2SAndreas Gohr    134 => 'raw HTML block: raw HTML pass-through not supported',
184b414dba2SAndreas Gohr    135 => 'raw HTML block: raw HTML pass-through not supported',
185b414dba2SAndreas Gohr    136 => 'raw HTML block (any-tag group): raw HTML pass-through not supported',
186b414dba2SAndreas Gohr    137 => 'raw HTML block: raw HTML pass-through not supported',
187b414dba2SAndreas Gohr    138 => 'raw HTML block: raw HTML pass-through not supported',
188b414dba2SAndreas Gohr    139 => 'raw HTML block: raw HTML pass-through not supported',
189b414dba2SAndreas Gohr    140 => 'raw HTML block: raw HTML pass-through not supported',
190b414dba2SAndreas Gohr    141 => 'raw HTML block: raw HTML pass-through not supported',
191b414dba2SAndreas Gohr    142 => 'raw HTML block: raw HTML pass-through not supported',
192b414dba2SAndreas Gohr    143 => 'raw HTML block: raw HTML pass-through not supported',
193b414dba2SAndreas Gohr    144 => 'raw HTML block: raw HTML pass-through not supported',
194b414dba2SAndreas Gohr    145 => 'raw HTML block: raw HTML pass-through not supported',
195b414dba2SAndreas Gohr    146 => 'raw HTML block: raw HTML pass-through not supported',
196b414dba2SAndreas Gohr    147 => 'raw HTML block: raw HTML pass-through not supported',
197b414dba2SAndreas Gohr    148 => 'raw HTML block: raw HTML pass-through not supported',
198b414dba2SAndreas Gohr    149 => 'raw HTML block: raw HTML pass-through not supported',
199b414dba2SAndreas Gohr    150 => 'raw HTML block: raw HTML pass-through not supported',
200b414dba2SAndreas Gohr    151 => 'raw HTML block: raw HTML pass-through not supported',
201b414dba2SAndreas Gohr    152 => 'raw HTML block: raw HTML pass-through not supported',
202b414dba2SAndreas Gohr    153 => 'raw HTML block: raw HTML pass-through not supported',
203b414dba2SAndreas Gohr    154 => 'raw HTML block: raw HTML pass-through not supported',
204b414dba2SAndreas Gohr    155 => 'raw HTML block: raw HTML pass-through not supported',
205b414dba2SAndreas Gohr    156 => 'raw HTML block: raw HTML pass-through not supported',
206b414dba2SAndreas Gohr    157 => 'raw HTML block: raw HTML pass-through not supported',
207b414dba2SAndreas Gohr    158 => 'raw HTML block: raw HTML pass-through not supported',
208b414dba2SAndreas Gohr    159 => 'raw HTML block: raw HTML pass-through not supported',
209b414dba2SAndreas Gohr    160 => 'raw HTML block: raw HTML pass-through not supported',
210b414dba2SAndreas Gohr
211b414dba2SAndreas Gohr    // --------------------------------------------------------------------
212b414dba2SAndreas Gohr    // Link reference definitions (§4.7) — single-pass lexer cannot resolve
213b414dba2SAndreas Gohr    // forward references, so the `[foo]: /url` definition lines are not
214b414dba2SAndreas Gohr    // recognised and the matching `[foo]` references stay literal. Same
215b414dba2SAndreas Gohr    // rationale as the reference-link entries at #535-579.
216b414dba2SAndreas Gohr    // Examples #168, #180-182 are NOT listed: their definitions are
217b414dba2SAndreas Gohr    // invalid (empty URL / inside indented code / inside fenced code /
218b414dba2SAndreas Gohr    // attached to a paragraph), so the spec also expects literal output
219b414dba2SAndreas Gohr    // for the `[foo]` reference, and DW agrees.
220b414dba2SAndreas Gohr    // --------------------------------------------------------------------
221b414dba2SAndreas Gohr    161 => 'link reference definition: forward-reference definitions not supported (single-pass lexer)',
222b414dba2SAndreas Gohr    162 => 'link reference definition: forward-reference definitions not supported (single-pass lexer)',
223b414dba2SAndreas Gohr    163 => 'link reference definition (multi-line title): forward-reference definitions not supported (single-pass lexer)',
224b414dba2SAndreas Gohr    164 => 'link reference definition (case-insensitive label): forward-reference definitions not supported (single-pass lexer)',
225b414dba2SAndreas Gohr    165 => 'link reference definition (Unicode case folding): forward-reference definitions not supported (single-pass lexer)',
226b414dba2SAndreas Gohr    166 => 'link reference definition (whitespace-collapsed label): forward-reference definitions not supported (single-pass lexer)',
227b414dba2SAndreas Gohr    167 => 'link reference definition (no link text used): forward-reference definitions not supported (single-pass lexer)',
228b414dba2SAndreas Gohr    169 => 'link reference definition (pointy-bracket destination): forward-reference definitions not supported (single-pass lexer)',
229b414dba2SAndreas Gohr    170 => 'link reference definition (no title, blank line in between): forward-reference definitions not supported (single-pass lexer)',
230b414dba2SAndreas Gohr    171 => 'link reference definition (title only, no destination): forward-reference definitions not supported (single-pass lexer)',
231b414dba2SAndreas Gohr    172 => 'link reference definition (multiple definitions): forward-reference definitions not supported (single-pass lexer)',
232b414dba2SAndreas Gohr    173 => 'link reference definition (first wins on duplicate label): forward-reference definitions not supported (single-pass lexer)',
233b414dba2SAndreas Gohr    174 => 'link reference definition (label case-insensitive): forward-reference definitions not supported (single-pass lexer)',
234b414dba2SAndreas Gohr    175 => 'link reference definition (used as paragraph delimiter): forward-reference definitions not supported (single-pass lexer)',
235b414dba2SAndreas Gohr    176 => 'link reference definition (no body following): forward-reference definitions not supported (single-pass lexer)',
236b414dba2SAndreas Gohr    177 => 'link reference definition (label with surrounding whitespace): forward-reference definitions not supported (single-pass lexer)',
237b414dba2SAndreas Gohr    178 => 'link reference definition (indented up to 3 spaces): forward-reference definitions not supported (single-pass lexer)',
238b414dba2SAndreas Gohr    179 => 'link reference definition (multi-line definition with title): forward-reference definitions not supported (single-pass lexer)',
239b414dba2SAndreas Gohr    183 => 'link reference definition (does not interrupt paragraph): forward-reference definitions not supported (single-pass lexer)',
240b414dba2SAndreas Gohr    184 => 'link reference definition (between blockquote and paragraph): forward-reference definitions not supported (single-pass lexer)',
241b414dba2SAndreas Gohr    185 => 'link reference definition (lone definition emits nothing): forward-reference definitions not supported (single-pass lexer)',
242b414dba2SAndreas Gohr    186 => 'link reference definition (definition then HR): forward-reference definitions not supported (single-pass lexer)',
243b414dba2SAndreas Gohr    187 => 'link reference definition (multiple defs in a row): forward-reference definitions not supported (single-pass lexer)',
244b414dba2SAndreas Gohr    188 => 'link reference definition (def inside blockquote): forward-reference definitions not supported (single-pass lexer)',
245b414dba2SAndreas Gohr    329 => 'reference link with entity-decoded URL in definition: depends on'
246b414dba2SAndreas Gohr         . ' link reference definitions, which forward-reference definitions'
247b414dba2SAndreas Gohr         . ' are not supported (single-pass lexer)',
248b414dba2SAndreas Gohr
249b414dba2SAndreas Gohr    // --------------------------------------------------------------------
2508ed75a23SAndreas Gohr    // Code-span edge cases that collide with project-wide decisions
2518ed75a23SAndreas Gohr    // (no raw HTML, no GFM angle-bracket autolinks, typography on by
2528ed75a23SAndreas Gohr    // default) or with the single-pass lexer's limits.
2538ed75a23SAndreas Gohr    // --------------------------------------------------------------------
2548ed75a23SAndreas Gohr    351 => 'code span vs. emphasis: cross-positional precedence would require'
2558ed75a23SAndreas Gohr         . ' a pre-scan pass — the single-pass lexer matches leftmost-first'
2568ed75a23SAndreas Gohr         . ' and cannot reject an earlier emphasis opener because a later'
2578ed75a23SAndreas Gohr         . ' backtick span would consume its closer',
258b414dba2SAndreas Gohr    352 => 'code span vs. link `[not a `link](/foo`)`: the link opener is'
259b414dba2SAndreas Gohr         . ' leftmost but a backtick span inside its label should consume'
260b414dba2SAndreas Gohr         . ' the closing `]` and `)` — single-pass lexer matches'
261b414dba2SAndreas Gohr         . ' leftmost-first and cannot reorder spans (see #351).',
2628ed75a23SAndreas Gohr    353 => 'code span: the trailing `"` outside the span is converted to a'
2638ed75a23SAndreas Gohr         . ' curly quote by DokuWiki typography, diverging from the spec HTML',
264b414dba2SAndreas Gohr    327 => 'raw HTML tag with entity in attribute: raw HTML pass-through not supported',
265b414dba2SAndreas Gohr    354 => 'raw HTML tag pass-through: raw HTML pass-through not supported',
2668ed75a23SAndreas Gohr    356 => 'GFM angle-bracket autolink `<http://…>`: not implemented — we'
2678ed75a23SAndreas Gohr         . ' rely on DokuWiki\'s existing bare-URL detection, which does not'
2688ed75a23SAndreas Gohr         . ' parse `<URL>` form',
2698ed75a23SAndreas Gohr
2708ed75a23SAndreas Gohr    // --------------------------------------------------------------------
27172b2703bSAndreas Gohr    // CommonMark §6.2 flanking-delimiter analysis — deliberately not
27272b2703bSAndreas Gohr    // implemented. DokuWiki's regex lexer uses leftmost-match and cannot
27372b2703bSAndreas Gohr    // apply CommonMark's left/right-flanking rules that distinguish
27472b2703bSAndreas Gohr    // word-chars, whitespace, and punctuation for `*`/`_` delimiters, or
27572b2703bSAndreas Gohr    // the "multiple-of-3" rule for overlapping runs. These examples all
27672b2703bSAndreas Gohr    // rely on that machinery.
27772b2703bSAndreas Gohr    // --------------------------------------------------------------------
27872b2703bSAndreas Gohr
27972b2703bSAndreas Gohr    // Unicode whitespace in flanking context. Our `\s` is ASCII-only
28072b2703bSAndreas Gohr    // because the lexer doesn't set the PCRE `u` flag.
28172b2703bSAndreas Gohr    363 => 'Unicode whitespace (U+00A0) flanking — requires u-flag-aware regex',
28272b2703bSAndreas Gohr
28372b2703bSAndreas Gohr    // Punctuation-adjacent flanking for `*` / `_` / `**` / `__`
28472b2703bSAndreas Gohr    362 => 'flanking: punctuation-adjacent `*` (left-flanking vs. right-flanking)',
28572b2703bSAndreas Gohr    368 => 'flanking: punctuation-adjacent `_`',
28672b2703bSAndreas Gohr    372 => 'flanking: intraword `_` with punctuation inside',
28772b2703bSAndreas Gohr    377 => 'flanking: `*` followed by `(` requires punctuation-aware flanking',
28872b2703bSAndreas Gohr    378 => 'flanking: nested `*(*foo*)*` requires flanking + balanced-pair analysis',
28972b2703bSAndreas Gohr    382 => 'flanking: nested `_(_foo_)_` requires flanking + balanced-pair analysis',
29072b2703bSAndreas Gohr    389 => 'flanking: punctuation-adjacent `**`',
29172b2703bSAndreas Gohr    394 => 'flanking: punctuation-adjacent `__`',
29272b2703bSAndreas Gohr    401 => 'flanking: `**` followed by `(`',
29372b2703bSAndreas Gohr    404 => 'flanking: nested `*bar*` inside `**foo ... foo**` with punctuation',
29472b2703bSAndreas Gohr    407 => 'flanking: `__` followed by `(`',
29572b2703bSAndreas Gohr    470 => 'flanking: nested `*_foo_*` requires balanced-pair analysis',
29672b2703bSAndreas Gohr    472 => 'flanking: nested `_*foo*_` requires balanced-pair analysis',
29772b2703bSAndreas Gohr
29872b2703bSAndreas Gohr    // Intraword `__` strong (even multibyte) — flanking rule for `_` requires
29972b2703bSAndreas Gohr    // examining whether the delimiter run is word-boundary-flanking, which our
30072b2703bSAndreas Gohr    // simple lookbehind/lookahead approximation doesn't fully match.
30172b2703bSAndreas Gohr    395 => 'flanking: intraword `__` (`foo__bar__`) — left-flanking vs right-flanking',
30272b2703bSAndreas Gohr    396 => 'flanking: intraword `__` across digits (`5__6__78`)',
30372b2703bSAndreas Gohr    397 => 'flanking: intraword `__` with Cyrillic',
30472b2703bSAndreas Gohr    398 => 'flanking: `__foo, __bar__, baz__` — flanking + balanced pairing',
30572b2703bSAndreas Gohr    409 => 'flanking: `__foo__bar` — intraword close',
30672b2703bSAndreas Gohr    410 => 'flanking: intraword `__` with Cyrillic (leading)',
30772b2703bSAndreas Gohr    411 => 'flanking: `__foo__bar__baz__` — multiple `__` pairs with flanking',
30872b2703bSAndreas Gohr    412 => 'flanking: `__(bar)__.` — punctuation-adjacent',
30972b2703bSAndreas Gohr
31072b2703bSAndreas Gohr    // Overlapping / multiple-of-3 rule for runs
31172b2703bSAndreas Gohr    416 => 'CommonMark rule 9 (overlapping same-delimiter `_foo _bar_ baz_`)',
31272b2703bSAndreas Gohr    417 => 'CommonMark overlapping `_` / `__` with flanking',
31372b2703bSAndreas Gohr    418 => 'CommonMark overlapping `*foo *bar**` — multiple-of-3 rule',
31472b2703bSAndreas Gohr    419 => 'CommonMark nested `*foo **bar** baz*` — balanced-pair analysis',
31572b2703bSAndreas Gohr    421 => 'CommonMark overlapping `*foo**bar*` — multiple-of-3',
31672b2703bSAndreas Gohr    422 => 'CommonMark nested `***foo** bar*` — triple-delimiter analysis',
31772b2703bSAndreas Gohr    423 => 'CommonMark nested `*foo **bar***` — triple-delimiter analysis',
31872b2703bSAndreas Gohr    424 => 'CommonMark nested `*foo**bar***` — triple-delimiter analysis',
31972b2703bSAndreas Gohr    425 => 'CommonMark triple `foo***bar***baz` — triple-delimiter analysis',
32072b2703bSAndreas Gohr    426 => 'CommonMark long delimiter runs `foo******bar*********baz`',
32172b2703bSAndreas Gohr    427 => 'CommonMark deeply nested `*foo **bar *baz* bim** bop*`',
32272b2703bSAndreas Gohr    434 => 'CommonMark overlapping `__foo __bar__ baz__` — multiple-of-3',
32372b2703bSAndreas Gohr    435 => 'CommonMark `____foo__ bar__` — leading long delimiter run',
32472b2703bSAndreas Gohr    436 => 'CommonMark `**foo **bar****` — trailing long delimiter run',
32572b2703bSAndreas Gohr    439 => 'CommonMark nested `***foo* bar**` — triple-delimiter',
32672b2703bSAndreas Gohr    440 => 'CommonMark nested `**foo *bar***` — triple-delimiter',
32772b2703bSAndreas Gohr    441 => 'CommonMark deeply nested `**foo *bar **baz** bim* bop**`',
32872b2703bSAndreas Gohr
32972b2703bSAndreas Gohr    // `__foo_` / `_foo__` — mixing `_` and `__` requires flanking to decide
33072b2703bSAndreas Gohr    // which delimiter pairs open/close.
33172b2703bSAndreas Gohr    463 => 'flanking: `__foo_` — mixed `_`/`__` pairing',
33272b2703bSAndreas Gohr    464 => 'flanking: `_foo__` — mixed `_`/`__` pairing',
33372b2703bSAndreas Gohr    465 => 'flanking: `___foo__` — delimiter-run length analysis',
33472b2703bSAndreas Gohr    466 => 'flanking: `____foo_` — delimiter-run length analysis',
33572b2703bSAndreas Gohr    467 => 'flanking: `__foo___` — delimiter-run length analysis',
33672b2703bSAndreas Gohr    468 => 'flanking: `_foo____` — delimiter-run length analysis',
33772b2703bSAndreas Gohr
33872b2703bSAndreas Gohr    // Long delimiter runs require excess-drop logic (2 outer chars dropped
33972b2703bSAndreas Gohr    // from each side). Stack-based pairing needed — out of scope.
34072b2703bSAndreas Gohr    473 => 'CommonMark `****foo****` — excess-drop (4+4 → strong only)',
34172b2703bSAndreas Gohr    474 => 'CommonMark `____foo____` — excess-drop (4+4 → strong only)',
34272b2703bSAndreas Gohr    475 => 'CommonMark `******foo******` — excess-drop (6+6 → strong only)',
34372b2703bSAndreas Gohr    477 => 'CommonMark `_____foo_____` — excess-drop (5+5 → em+strong, 2 dropped each side)',
34472b2703bSAndreas Gohr
34572b2703bSAndreas Gohr    // Overlapping / crossing delimiters
34672b2703bSAndreas Gohr    478 => 'CommonMark `*foo _bar* baz_` — overlapping different delimiters',
34772b2703bSAndreas Gohr    479 => 'CommonMark `*foo __bar *baz bim__ bam*` — crossing delimiters',
34872b2703bSAndreas Gohr    480 => 'CommonMark `**foo **bar baz**` — overlapping same delimiter',
3498719732dSAndreas Gohr
350b414dba2SAndreas Gohr    // Emphasis vs. angle-bracket autolink: same root cause as #351 (the
351b414dba2SAndreas Gohr    // single-pass lexer matches leftmost-first and cannot reject an
352b414dba2SAndreas Gohr    // earlier `**`/`__` opener because a later `<URL>` autolink would
353b414dba2SAndreas Gohr    // consume its closer).
354b414dba2SAndreas Gohr    489 => 'emphasis vs. angle-bracket autolink `**a<http://...?q=**>`:'
355b414dba2SAndreas Gohr         . ' leftmost-match cannot reorder spans — see #351 for the'
356b414dba2SAndreas Gohr         . ' single-pass-lexer rationale.',
357b414dba2SAndreas Gohr    490 => 'emphasis vs. angle-bracket autolink `__a<http://...?q=__>`:'
358b414dba2SAndreas Gohr         . ' leftmost-match cannot reorder spans — see #351.',
359b414dba2SAndreas Gohr
3608719732dSAndreas Gohr    // --------------------------------------------------------------------
361e89aeebdSAndreas Gohr    // Inline link `[text](url)` — features GfmLink deliberately does not
362e89aeebdSAndreas Gohr    // implement. Either rarely-used syntax paid for with disproportionate
363e89aeebdSAndreas Gohr    // regex complexity, or single-pass-lexer limits that can't be worked
364e89aeebdSAndreas Gohr    // around inside one mode.
365e89aeebdSAndreas Gohr    // --------------------------------------------------------------------
366e89aeebdSAndreas Gohr
367e89aeebdSAndreas Gohr    // GFM link title attribute (`"title"` / `'title'` / `(title)` after
368e89aeebdSAndreas Gohr    // the URL). Parses cleanly but is discarded: DokuWiki's link handler
369e89aeebdSAndreas Gohr    // instructions have no title-attribute slot, and plumbing one through
370e89aeebdSAndreas Gohr    // every renderer is out of scope for GfmLink.
371*eb15e634SAndreas Gohr    328 => 'link with entity-decoded URL and title: URL side decodes correctly,'
372*eb15e634SAndreas Gohr         . ' but the title attribute is discarded — DokuWiki link instructions'
373*eb15e634SAndreas Gohr         . ' have no title slot.',
374e89aeebdSAndreas Gohr    493 => 'link title attribute: GfmLink parses but discards — DokuWiki link instructions have no title slot',
375e89aeebdSAndreas Gohr    513 => 'link title attribute (three quoting styles): discarded by GfmLink',
376e89aeebdSAndreas Gohr    515 => 'link title separated by non-breaking space: title slot not supported',
377e89aeebdSAndreas Gohr    516 => 'link title with nested balanced quotes: Markdown.pl quirk, not supported',
378e89aeebdSAndreas Gohr    517 => 'link title with different quote type for inner quotes: title slot not supported',
379e89aeebdSAndreas Gohr    518 => 'multi-line link title: title slot not supported',
380e89aeebdSAndreas Gohr
381e89aeebdSAndreas Gohr    // Pointy-bracket link destinations `<...>`. Rarely used; regex cost
382e89aeebdSAndreas Gohr    // and interaction with raw-HTML detection outweigh the benefit.
383e89aeebdSAndreas Gohr    496 => 'pointy-bracket link destination `<>`: not supported',
384e89aeebdSAndreas Gohr    498 => 'pointy-bracket destination with spaces `<...>`: not supported',
385e89aeebdSAndreas Gohr    500 => 'pointy-bracket destination with newline: not supported',
386e89aeebdSAndreas Gohr    501 => 'pointy-bracket destination containing `)`: not supported',
387e89aeebdSAndreas Gohr    502 => 'pointy-bracket destination with trailing backslash: not supported',
388e89aeebdSAndreas Gohr    503 => 'malformed pointy-bracket destinations: renderer output differs',
389e89aeebdSAndreas Gohr    507 => 'pointy-bracket destination wrapping unbalanced parens: not supported',
390e89aeebdSAndreas Gohr
391e89aeebdSAndreas Gohr    // Balanced-parens inside URL destinations.
392e89aeebdSAndreas Gohr    505 => 'balanced-parens in URL destination: not supported (regex single-level)',
393e89aeebdSAndreas Gohr
394e89aeebdSAndreas Gohr    // Other URL-level edges.
395e89aeebdSAndreas Gohr    495 => 'empty URL destination `[link]()`: pattern requires non-empty URL',
396e89aeebdSAndreas Gohr    510 => 'backslash in URL destination: URL-encoding differs from spec',
397e89aeebdSAndreas Gohr    511 => 'HTML entity / percent-encoding in URL: renderer normalization differs',
398e89aeebdSAndreas Gohr    512 => 'link destination that parses as a title: edge case not supported',
399b414dba2SAndreas Gohr    337 => 'entity-decoded `&quot;` inside link URL slot: spec rejects the'
400b414dba2SAndreas Gohr         . ' link because the decoded `"` would split URL from title, but'
401b414dba2SAndreas Gohr         . ' GfmLink uses a permissive `[^)\n]+` URL slot and accepts the'
402b414dba2SAndreas Gohr         . ' whole run as the URL — strict GFM URL rejection not implemented',
403e89aeebdSAndreas Gohr
404e89aeebdSAndreas Gohr    // Inherent single-pass-lexer limits for link text containing nested
405e89aeebdSAndreas Gohr    // structures. These cannot be resolved inside one mode.
406e89aeebdSAndreas Gohr    522 => 'nested bracket forms inner link, outer falls back to literal',
407e89aeebdSAndreas Gohr    526 => 'nested links: inner is a link, outer falls back to literal',
408e89aeebdSAndreas Gohr    527 => 'nested links inside emphasis: not supported',
409e89aeebdSAndreas Gohr    529 => 'link text grouping vs. emphasis: leftmost-match cannot override',
410e89aeebdSAndreas Gohr    530 => 'emphasis/bracket crossing: leftmost-match cannot override',
411e89aeebdSAndreas Gohr    532 => 'raw HTML inside link text: project-wide "no raw HTML" limit',
412e89aeebdSAndreas Gohr    533 => 'code span inside link text: requires pre-scan pass (see #351)',
413e89aeebdSAndreas Gohr    534 => 'autolink inside link text: raw `<URL>` autolinks not supported (see #356)',
414e89aeebdSAndreas Gohr
415e89aeebdSAndreas Gohr    // Reference links (`[text][id]`, `[text][]`, `[foo]` with matching
416e89aeebdSAndreas Gohr    // `[foo]: url` definition). Not implemented: resolving forward
417e89aeebdSAndreas Gohr    // references would require a two-pass parse, but DokuWiki's lexer is
418e89aeebdSAndreas Gohr    // single-pass. Inline links `[text](url)` are the only supported
419e89aeebdSAndreas Gohr    // form.
420e89aeebdSAndreas Gohr    535 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
421e89aeebdSAndreas Gohr    536 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
422e89aeebdSAndreas Gohr    537 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
423e89aeebdSAndreas Gohr    538 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
424e89aeebdSAndreas Gohr    539 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
425e89aeebdSAndreas Gohr    540 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
426e89aeebdSAndreas Gohr    541 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
427e89aeebdSAndreas Gohr    542 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
428e89aeebdSAndreas Gohr    543 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
429e89aeebdSAndreas Gohr    544 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
430e89aeebdSAndreas Gohr    545 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
431e89aeebdSAndreas Gohr    546 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
432e89aeebdSAndreas Gohr    547 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
433e89aeebdSAndreas Gohr    548 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
434e89aeebdSAndreas Gohr    549 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
435e89aeebdSAndreas Gohr    550 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
436e89aeebdSAndreas Gohr    551 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
437e89aeebdSAndreas Gohr    552 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
438e89aeebdSAndreas Gohr    553 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
439e89aeebdSAndreas Gohr    557 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
440e89aeebdSAndreas Gohr    558 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
441e89aeebdSAndreas Gohr    560 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
442e89aeebdSAndreas Gohr    561 => 'collapsed reference link: forward-reference definitions not supported (single-pass lexer)',
443e89aeebdSAndreas Gohr    562 => 'collapsed reference link: forward-reference definitions not supported (single-pass lexer)',
444e89aeebdSAndreas Gohr    563 => 'collapsed reference link: forward-reference definitions not supported (single-pass lexer)',
445e89aeebdSAndreas Gohr    564 => 'collapsed reference link: forward-reference definitions not supported (single-pass lexer)',
446e89aeebdSAndreas Gohr    565 => 'shortcut reference link: forward-reference definitions not supported (single-pass lexer)',
447e89aeebdSAndreas Gohr    566 => 'shortcut reference link: forward-reference definitions not supported (single-pass lexer)',
448e89aeebdSAndreas Gohr    567 => 'shortcut reference link: forward-reference definitions not supported (single-pass lexer)',
449e89aeebdSAndreas Gohr    568 => 'shortcut reference link: forward-reference definitions not supported (single-pass lexer)',
450e89aeebdSAndreas Gohr    569 => 'shortcut reference link: forward-reference definitions not supported (single-pass lexer)',
451e89aeebdSAndreas Gohr    570 => 'shortcut reference link: forward-reference definitions not supported (single-pass lexer)',
452e89aeebdSAndreas Gohr    571 => 'shortcut reference link with escape: forward-reference definitions not supported (single-pass lexer)',
453e89aeebdSAndreas Gohr    572 => 'shortcut reference link with emphasis: forward-reference definitions not supported (single-pass lexer)',
454e89aeebdSAndreas Gohr    573 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
455e89aeebdSAndreas Gohr    574 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
456e89aeebdSAndreas Gohr    575 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
457e89aeebdSAndreas Gohr    576 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
458e89aeebdSAndreas Gohr    577 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
459e89aeebdSAndreas Gohr    578 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
460e89aeebdSAndreas Gohr    579 => 'reference link: forward-reference definitions not supported (single-pass lexer)',
461e89aeebdSAndreas Gohr
462e89aeebdSAndreas Gohr    // --------------------------------------------------------------------
4633440a8c0SAndreas Gohr    // Inline image `![alt](url)`. The XHTML renderer's default media
4643440a8c0SAndreas Gohr    // rendering diverges from GFM's bare <img> (it wraps the image in a
4653440a8c0SAndreas Gohr    // detail-page <a> with fetch.php/detail.php proxy URLs) — GfmSpecTest uses
4663440a8c0SAndreas Gohr    // SpecCompatRenderer to emit spec-shape bare <img>, so only the
4673440a8c0SAndreas Gohr    // parser-level or feature-level gaps remain as skips: title attribute
4683440a8c0SAndreas Gohr    // (no DW slot), reference images, pointy-bracket destinations, nested
4693440a8c0SAndreas Gohr    // brackets, and escape-dependent cases.
4703440a8c0SAndreas Gohr    // --------------------------------------------------------------------
4713440a8c0SAndreas Gohr
4723440a8c0SAndreas Gohr    580 => 'image with title attribute: GfmMedia discards titles (no DW slot)',
4733440a8c0SAndreas Gohr    581 => 'reference-style image: forward-reference definitions not supported (single-pass lexer)',
4743440a8c0SAndreas Gohr    582 => 'nested image-in-image `![foo ![bar](x)](y)`: alt class forbids brackets;'
4753440a8c0SAndreas Gohr         . ' leftmost-match cannot reorder — outer falls back to literal (see #526)',
4763440a8c0SAndreas Gohr    583 => 'link-in-image alt `![foo [bar](x)](y)`: alt class forbids brackets;'
4773440a8c0SAndreas Gohr         . ' leftmost-match cannot reorder — outer falls back to literal (see #526)',
4783440a8c0SAndreas Gohr    584 => 'collapsed reference-style image: forward-reference definitions not supported',
4793440a8c0SAndreas Gohr    585 => 'full reference-style image: forward-reference definitions not supported',
4803440a8c0SAndreas Gohr    587 => 'image with title attribute: title discarded (no DW slot)',
4813440a8c0SAndreas Gohr    588 => 'pointy-bracket image destination `![alt](<url>)`: not supported (see GfmLink #496)',
4823440a8c0SAndreas Gohr    590 => 'reference-style image: forward-reference definitions not supported',
4833440a8c0SAndreas Gohr    591 => 'reference-style image (case-insensitive label): forward-reference definitions not supported',
4843440a8c0SAndreas Gohr    592 => 'collapsed reference-style image `![foo][]`: forward-reference definitions not supported',
4853440a8c0SAndreas Gohr    593 => 'collapsed reference-style image with emphasis in label: forward-reference definitions not supported',
4863440a8c0SAndreas Gohr    594 => 'collapsed reference-style image (case-insensitive): forward-reference definitions not supported',
4873440a8c0SAndreas Gohr    595 => 'reference-style image with intervening whitespace: forward-reference definitions not supported',
4883440a8c0SAndreas Gohr    596 => 'shortcut reference-style image `![foo]`: forward-reference definitions not supported',
4893440a8c0SAndreas Gohr    597 => 'shortcut reference-style image with emphasis: forward-reference definitions not supported',
4903440a8c0SAndreas Gohr    598 => 'image with unescaped nested brackets `![[foo]]`: literal-fallback behavior not supported',
4913440a8c0SAndreas Gohr    599 => 'shortcut reference-style image (case-insensitive): forward-reference definitions not supported',
492b414dba2SAndreas Gohr    600 => 'image-via-reference fallback `!\[foo]` with `[foo]: /url`: forward-reference definitions not supported (single-pass lexer)',
493b414dba2SAndreas Gohr    601 => 'image-via-reference fallback `\![foo]` with `[foo]: /url`: forward-reference definitions not supported (single-pass lexer)',
4943440a8c0SAndreas Gohr
4953440a8c0SAndreas Gohr    // --------------------------------------------------------------------
4968719732dSAndreas Gohr    // ATX heading collisions with DokuWiki-specific behavior.
4978719732dSAndreas Gohr    // --------------------------------------------------------------------
4988719732dSAndreas Gohr    38 => 'ATX heading with leading spaces: GFM tolerates 0-3 spaces of'
4998719732dSAndreas Gohr        . ' indent before the opener; we require the `#` at column 0.'
5008719732dSAndreas Gohr        . ' Indent tolerance collides with DokuWiki\'s 2-space-indent'
5018719732dSAndreas Gohr        . ' preformatted block and isn\'t worth untangling',
5028719732dSAndreas Gohr    39 => 'indented code block: DokuWiki uses 2-space indent for'
5038719732dSAndreas Gohr        . ' preformatted; GFM 4-space indented code blocks are not'
5048719732dSAndreas Gohr        . ' implemented',
5058719732dSAndreas Gohr    40 => 'indented code block: 4-space indent after a paragraph is a'
5068719732dSAndreas Gohr        . ' continuation in GFM but preformatted in DokuWiki — not'
5078719732dSAndreas Gohr        . ' implemented',
5088719732dSAndreas Gohr    41 => 'ATX heading with leading spaces: second heading is indented'
5098719732dSAndreas Gohr        . ' by 2 spaces; we require the `#` at column 0',
5108719732dSAndreas Gohr    49 => 'empty ATX heading: DokuWiki\'s XHTML renderer deliberately'
5118719732dSAndreas Gohr        . ' skips blank headings (blank() guard in Doku_Renderer_xhtml::header)',
512685560ebSAndreas Gohr
513685560ebSAndreas Gohr    // --------------------------------------------------------------------
514685560ebSAndreas Gohr    // List items / Lists — list features GfmListblock deliberately does
515685560ebSAndreas Gohr    // not implement. The simplifications are by design: indentation uses
516685560ebSAndreas Gohr    // a fixed 2-space-multiple step starting at 0, lazy continuation is
517685560ebSAndreas Gohr    // not supported, and the rewriter groups items by 'u'/'o' type only.
518685560ebSAndreas Gohr    // The buckets are:
519685560ebSAndreas Gohr    //
520685560ebSAndreas Gohr    //  A. Extra spaces after the marker. CommonMark rolls them (up to
521685560ebSAndreas Gohr    //     4) into the content column; we dedent at `marker_width + 1`,
522685560ebSAndreas Gohr    //     collapsing the extras.
523685560ebSAndreas Gohr    //  B. 1- or 3-space indent for nesting (we round down to nearest 2).
524685560ebSAndreas Gohr    //  C. Lazy continuation (column-0 paragraph wrap inside an item).
525685560ebSAndreas Gohr    //  D. Strict CommonMark loose/tight classification (every blank line
526685560ebSAndreas Gohr    //     between items / inside items reclassifies; we use a simpler
527685560ebSAndreas Gohr    //     single-paragraph-tight, multi-paragraph-loose rule).
528685560ebSAndreas Gohr    //  E. Marker-character-change splits ordered lists ('.' vs ')') or
529685560ebSAndreas Gohr    //     unordered ('-' vs '+' vs '*'). Our rewriter groups by 'u' / 'o'
530685560ebSAndreas Gohr    //     type only, not by marker character.
531685560ebSAndreas Gohr    //  F. List interrupting a paragraph without a blank line — requires a
532685560ebSAndreas Gohr    //     multi-pass block parser to revisit prior text.
533685560ebSAndreas Gohr    //
534685560ebSAndreas Gohr    // Examples that depend on a mode that is still pending are intentionally
535685560ebSAndreas Gohr    // NOT skipped — they remain visible failing tests until that mode lands.
536685560ebSAndreas Gohr    // The list entries themselves follow the Block quotes section below.
537685560ebSAndreas Gohr    // --------------------------------------------------------------------
538309a0852SAndreas Gohr    // --------------------------------------------------------------------
539309a0852SAndreas Gohr    // Block quotes — deliberate scope reductions vs. strict GFM. The
540309a0852SAndreas Gohr    // unified GfmQuote mode (replacing DW Quote) covers `>` blockquotes
541309a0852SAndreas Gohr    // for both DW and MD pages, but several CommonMark blockquote rules
542309a0852SAndreas Gohr    // are out of scope:
543309a0852SAndreas Gohr    //
544309a0852SAndreas Gohr    // - 1-3 space indent before `>` (column-0-only policy, consistent
545309a0852SAndreas Gohr    //   with GfmCode / GfmFile / GfmHeader).
546309a0852SAndreas Gohr    // - Lazy continuation (paragraph text without `>` on continuation
547309a0852SAndreas Gohr    //   lines). Same policy as GfmListblock — markers required on
548309a0852SAndreas Gohr    //   every line.
549309a0852SAndreas Gohr    // - Headers inside quotes — sub-parser excludes BASEONLY so header
550309a0852SAndreas Gohr    //   instructions don't drive TOC/section-edit anchors that don't
551309a0852SAndreas Gohr    //   compose with `<blockquote>`. Same rationale as GfmListblock's
552309a0852SAndreas Gohr    //   header exclusion inside list items.
553309a0852SAndreas Gohr    // - Setext-style block constructs (the `---` underline collides
554309a0852SAndreas Gohr    //   with DW's HR rule).
555309a0852SAndreas Gohr    //
556309a0852SAndreas Gohr    // Examples that depend on still-pending modes are intentionally NOT
557309a0852SAndreas Gohr    // skipped — they stay visible as failing tests until those modes
558309a0852SAndreas Gohr    // land.
559309a0852SAndreas Gohr    // --------------------------------------------------------------------
560309a0852SAndreas Gohr    206 => 'block quotes: header inside quote — sub-parser excludes'
561309a0852SAndreas Gohr         . ' BASEONLY (TOC / section-edit anchors do not compose with'
562309a0852SAndreas Gohr         . ' `<blockquote>`). Same policy as GfmListblock for `<li>`.',
563309a0852SAndreas Gohr    207 => 'block quotes: header inside quote with no space after `>` —'
564309a0852SAndreas Gohr         . ' see #206 for the BASEONLY exclusion rationale.',
565309a0852SAndreas Gohr    208 => 'block quotes: leading-space `>` (1-3 spaces of indent) —'
566309a0852SAndreas Gohr         . ' column-0-only policy, consistent with GfmCode / GfmFile.',
567309a0852SAndreas Gohr    210 => 'block quotes: lazy continuation `> # Foo\n> bar\nbaz` —'
568309a0852SAndreas Gohr         . ' every quote line must begin with `>` at column 0. Same'
569309a0852SAndreas Gohr         . ' policy as GfmListblock.',
570309a0852SAndreas Gohr    211 => 'block quotes: lazy continuation `> bar\nbaz\n> foo` —'
571309a0852SAndreas Gohr         . ' see #210.',
572309a0852SAndreas Gohr    212 => 'block quotes: Setext heading underline `---` after `> foo`'
573309a0852SAndreas Gohr         . ' — no Setext headings (the `---` collides with DW HR syntax).',
574309a0852SAndreas Gohr    215 => 'block quotes: fenced code block split across blockquote'
575309a0852SAndreas Gohr         . ' boundary — fence inside quote followed by non-`>` lines'
576309a0852SAndreas Gohr         . ' depends on the same lazy-continuation rule we do not'
577309a0852SAndreas Gohr         . ' implement (see #210).',
578309a0852SAndreas Gohr    216 => 'block quotes: lazy continuation `> foo\n    - bar` — see #210.',
579309a0852SAndreas Gohr    225 => 'block quotes: lazy continuation `> bar\nbaz` — see #210.',
580309a0852SAndreas Gohr    227 => 'block quotes: lazy continuation `> bar\n>\nbaz` — see #210.',
581309a0852SAndreas Gohr    228 => 'block quotes: lazy continuation in nested quote'
582309a0852SAndreas Gohr         . ' `> > > foo\nbar` — see #210.',
583309a0852SAndreas Gohr    229 => 'block quotes: lazy continuation across nested levels'
584309a0852SAndreas Gohr         . ' `>>> foo\n> bar\n>>baz` — see #210.',
585309a0852SAndreas Gohr
586685560ebSAndreas Gohr    232 => 'list items: marker-width content-column alignment (A)',
587685560ebSAndreas Gohr    235 => 'list items: marker-width content-column alignment (A)',
588685560ebSAndreas Gohr    249 => 'list items: marker-width-driven content-column alignment for `10. foo` (A)',
589685560ebSAndreas Gohr    254 => 'list items: marker-width content-column alignment edge case (A)',
590685560ebSAndreas Gohr    258 => 'list items: marker-width content-column for `1.  foo` (A)',
591685560ebSAndreas Gohr    263 => 'list items: indent ambiguity at column 0/1/2 (B)',
592685560ebSAndreas Gohr    264 => 'list items: 1-space-indent variation (B)',
593685560ebSAndreas Gohr    265 => 'list items: marker-width with multi-line continuation (A)',
594685560ebSAndreas Gohr    266 => 'list items: marker-width with multi-line continuation (A)',
595685560ebSAndreas Gohr    267 => 'list items: lazy continuation (C)',
596685560ebSAndreas Gohr    268 => 'list items: lazy continuation (C)',
597685560ebSAndreas Gohr    270 => 'list items: lazy continuation across blank line (C+D)',
598685560ebSAndreas Gohr    273 => 'list items: list interrupting a paragraph without blank line (F)',
599685560ebSAndreas Gohr    275 => 'list items: 3-space indent rounds to 2 — sub-list under previous item (B)',
600685560ebSAndreas Gohr    276 => 'list items: marker-width content-column with mixed types (A+E)',
601685560ebSAndreas Gohr    277 => 'list items: nested markers on a single line (A)',
602685560ebSAndreas Gohr    278 => 'list items: marker-character switch splits the list (E)',
603685560ebSAndreas Gohr    281 => 'lists: marker-character change splits unordered list `-` -> `+` (E)',
604685560ebSAndreas Gohr    282 => 'lists: ordered delimiter switch splits list `.` -> `)` (E)',
605685560ebSAndreas Gohr    284 => 'lists: list interrupting paragraph without blank line (F)',
606685560ebSAndreas Gohr    286 => 'lists: marker-width content-column alignment for ordered list (A)',
607685560ebSAndreas Gohr    287 => 'lists: triple blank line + indented continuation in deeply nested item (D)',
608685560ebSAndreas Gohr    288 => 'lists: marker-character change at deeper level (E)',
609685560ebSAndreas Gohr    289 => 'lists: marker-character change with type switch (E)',
610685560ebSAndreas Gohr    290 => 'lists: 1-space-indent variations of items, all stay top-level (B)',
611685560ebSAndreas Gohr    291 => 'lists: 1-space-indent variations on ordered list (B)',
612685560ebSAndreas Gohr    292 => 'lists: marker-character change splits inside nested list (E)',
613685560ebSAndreas Gohr    293 => 'lists: marker-character change with mixed indent (E+B)',
614685560ebSAndreas Gohr    294 => 'lists: lazy continuation across types (C+E)',
615685560ebSAndreas Gohr    295 => 'lists: lazy continuation in nested list (C)',
616685560ebSAndreas Gohr    296 => 'lists: lazy continuation across blank line (C+D)',
617685560ebSAndreas Gohr    297 => 'lists: blank-line classification for loose/tight in nested list (D)',
618685560ebSAndreas Gohr    298 => 'lists: blank-line classification (D)',
619685560ebSAndreas Gohr    300 => 'lists: blank-line classification with marker change (D+E)',
620685560ebSAndreas Gohr    301 => 'lists: blank-line classification + marker-width alignment (D+A)',
621685560ebSAndreas Gohr    304 => 'lists: blank line between sub-list items affects loose/tight (D)',
622685560ebSAndreas Gohr    305 => 'lists: blank line between deeply nested items (D)',
623685560ebSAndreas Gohr    306 => 'lists: blank line at the end of a loose list affects classification (D)',
62474031e46SAndreas Gohr
62574031e46SAndreas Gohr    // --------------------------------------------------------------------
62674031e46SAndreas Gohr    // Backslash-escape examples (§6.1) that fail for reasons unrelated to
62774031e46SAndreas Gohr    // GfmEscape itself: renderer divergences, typography conversion, and
62874031e46SAndreas Gohr    // already-skipped GFM features (autolinks, raw HTML, reference links,
62974031e46SAndreas Gohr    // discarded link titles). The escape mechanic itself works.
63074031e46SAndreas Gohr    // --------------------------------------------------------------------
63174031e46SAndreas Gohr    308 => 'backslash escapes: apostrophe is rendered as `&#039;` by DW while'
63274031e46SAndreas Gohr         . ' the spec expects a literal `\'` — renderer policy difference,'
63374031e46SAndreas Gohr         . ' not an escape bug',
63474031e46SAndreas Gohr    310 => 'backslash escapes: DW typography converts straight `"..."` to curly'
63574031e46SAndreas Gohr         . ' quotes when $conf[typography] is on, diverging from spec output',
63674031e46SAndreas Gohr    316 => 'backslash escapes inside angle-bracket autolinks: GFM autolink'
63774031e46SAndreas Gohr         . ' `<URL>` form not implemented (see example 356)',
63874031e46SAndreas Gohr    317 => 'backslash escapes inside raw HTML: raw HTML pass-through is not'
63974031e46SAndreas Gohr         . ' supported by default (see example 354)',
64074031e46SAndreas Gohr    318 => 'backslash escapes in link title: title attribute is discarded — DW'
641309a0852SAndreas Gohr         . ' link instructions have no title slot',
64274031e46SAndreas Gohr    319 => 'backslash escapes in reference-link definition: link reference'
64374031e46SAndreas Gohr         . ' definitions not supported (single-pass lexer cannot resolve'
64474031e46SAndreas Gohr         . ' forward references)',
645c4bcbc2eSAndreas Gohr
646c4bcbc2eSAndreas Gohr    // --------------------------------------------------------------------
647b414dba2SAndreas Gohr    // Raw HTML (§6.6) — inline raw HTML pass-through. Same project-wide
648b414dba2SAndreas Gohr    // decision as HTML blocks (#118-160): DokuWiki escapes `<` as `&lt;`
649b414dba2SAndreas Gohr    // by default; the `<html>` block is the opt-in. Examples #637 and
650b414dba2SAndreas Gohr    // #640 are intentionally NOT listed — the spec there expects literal
651b414dba2SAndreas Gohr    // `&lt;...&gt;` escaping for malformed tags, which DW also produces,
652b414dba2SAndreas Gohr    // so they pass naturally.
653b414dba2SAndreas Gohr    // --------------------------------------------------------------------
654b414dba2SAndreas Gohr    632 => 'raw HTML inline (open tag): raw HTML pass-through not supported',
655b414dba2SAndreas Gohr    633 => 'raw HTML inline (closing tag): raw HTML pass-through not supported',
656b414dba2SAndreas Gohr    634 => 'raw HTML inline (multi-line attributes): raw HTML pass-through not supported',
657b414dba2SAndreas Gohr    635 => 'raw HTML inline (line breaks in attributes): raw HTML pass-through not supported',
658b414dba2SAndreas Gohr    636 => 'raw HTML inline (custom tags / attribute syntax): raw HTML pass-through not supported',
659b414dba2SAndreas Gohr    638 => 'raw HTML inline (illegal attribute names): raw HTML pass-through not supported',
660b414dba2SAndreas Gohr    639 => 'raw HTML inline (illegal attribute values): raw HTML pass-through not supported',
661b414dba2SAndreas Gohr    641 => 'raw HTML inline (open and closing tags): raw HTML pass-through not supported',
662b414dba2SAndreas Gohr    642 => 'raw HTML inline (HTML comment): raw HTML pass-through not supported',
663b414dba2SAndreas Gohr    643 => 'raw HTML inline (invalid comment): raw HTML pass-through not supported',
664b414dba2SAndreas Gohr    644 => 'raw HTML inline (processing instruction): raw HTML pass-through not supported',
665b414dba2SAndreas Gohr    645 => 'raw HTML inline (declaration): raw HTML pass-through not supported',
666b414dba2SAndreas Gohr    646 => 'raw HTML inline (declaration single-letter name): raw HTML pass-through not supported',
667b414dba2SAndreas Gohr    647 => 'raw HTML inline (declaration EMPTY): raw HTML pass-through not supported',
668b414dba2SAndreas Gohr    648 => 'raw HTML inline (CDATA section): raw HTML pass-through not supported',
669b414dba2SAndreas Gohr    649 => 'raw HTML inline (entity reference inside attribute): raw HTML pass-through not supported',
670b414dba2SAndreas Gohr    650 => 'raw HTML inline (backslash escape inside attribute): raw HTML pass-through not supported',
671b414dba2SAndreas Gohr    651 => 'raw HTML inline (entity-escaped quote inside attribute): raw HTML pass-through not supported',
672b414dba2SAndreas Gohr
673b414dba2SAndreas Gohr    // --------------------------------------------------------------------
674c4bcbc2eSAndreas Gohr    // Hard line breaks (GfmLinebreak) — both delimiter forms (two trailing
675c4bcbc2eSAndreas Gohr    // spaces and `\` before newline) work in paragraphs, emphasis, and
676c4bcbc2eSAndreas Gohr    // other inline containers. The skipped cases sit inside raw HTML tags,
677c4bcbc2eSAndreas Gohr    // which DokuWiki does not pass through by default.
678c4bcbc2eSAndreas Gohr    // --------------------------------------------------------------------
679b414dba2SAndreas Gohr    662 => 'hard line break inside a raw HTML tag: raw HTML pass-through not supported',
680c4bcbc2eSAndreas Gohr    663 => 'hard line break (backslash form) inside a raw HTML tag — see'
681c4bcbc2eSAndreas Gohr         . ' #662. Raw HTML out of scope.',
68272b2703bSAndreas Gohr];
683