1 // interactions between !=> and &~ mean that I need to rethink the chartage
2 // indentation styling...
3 // literal blocks [[need to ignore bracing]] double-colon style?
4 // definition -- by prior line indentation, like headings in the original structured text
7 // output formats: latex, contex, ps, pdf, html, man, txt, rfc
15 // "reference-style" links
24 // Arrows: <- -> => <= <->
27 // - attention, caution, danger, error, hint, important, note, tip, warning
30 // figure-with-caption
31 // epigraph (end-of-chapter note)
32 // compound paragraph (??)
38 // simple macros (#define) (\define)
40 // table representation
50 // FIXME: these have to go at the top so they have their dropAll bit set before PreSequence.build...
55 //////////////////////////////////////////////////////////////////////////////
59 Doc = Doc:: head:{Header} body:Body /ws
60 Header = Header:: "header" attrs:{ kv */ ws } /ws
61 Body = Body:: sections:(Section*/ws)
62 Section = { Section:: header:SectionHeader paragraphs:Paragraph* /ws }
63 SectionHeader = "==" SectionHeaderBody "=="
64 SectionHeaderBody = "=" SectionHeaderBody "="
65 > !ws (Chars:: text:alphanum++) !ws
68 blank = !sp "\n" !sp "\n" !ws
71 kv = kv:: key:word "=" val:text /ws
74 Paragraph = Blockquote:: { "\"\" " text }
78 onums = nums !(". "|") ")
81 uli = "* " (!ws text &~ any (oli|uli))
82 oli = !("# "|onums) (!ws text &~ any (oli|uli))
88 > "[]":: { UL:: uli+/ws } Itemx
89 | "[]":: { OL:: oli+/ws } Itemx
92 > "[]":: structured Itemx
94 > "[]":: (Chars:: text:alphanum++) Itemx
95 > "[]":: "\"" text "\"" Itemx
97 > "[]":: (Symbol:: sym++) Itemx
98 > "[]":: Paragraph Itemx
100 blockquote = Blockquote:: "\"\"" text "\"\""
101 | Blockquote:: "\"\"" block
103 pre = Verbatim:: "[verbatim]" { ~[]+ } /ws // FIXME doesn't work
105 styled = Underline:: "__" text "__"
106 | Footnote:: "((" text "))"
107 | TT:: "[[" text "]]"
108 | Citation:: "[" word "]"
109 | Strikethrough:: "!!" text "!!"
110 | Superscript:: "^^" (word|block)
111 | Subscript:: ",," (word|block)
112 | Smallcap:: "\\sc" block
113 | Bold:: "++" text "++"
114 | Keyword:: "!" (word|block)
115 | Italic:: "**" text "**"
119 link = Link:: text:({ text }) "->" href:(url|email)
120 > Link:: text:alphanum++ !ws "->" href:(url|email)
122 structured = command & "\\" [a-zA-Z0-9]++ block?
127 glyph = Euro:: "(e)" | "(r)" | "(c)" | "(tm)" | "--" | "..."
129 command = Today:: "\\today"
132 // URLs //////////////////////////////////////////////////////////////////////////////
134 // interesting opportunity to show off boolean grammars here: define other
135 // subtypes of url (ftp, etc) as conjunctions, but the "master pattern"
136 // only gets parsed once
139 username = [a-zA-Z0-9;/?:&=$\-_.+]++
140 password = [a-zA-Z0-9;/?:&=$\-_.+]++
141 urlc = [a-zA-Z0-9;/?:&=$\-_.+@]
144 | urlescape:: "%" [0-9] [0-9]
145 url = "mailto" ":" email -> ~urlv
146 > URL:: method:method "://" login:url_login? host:host port:(":" nums)? path:("/" urlpath)? -> ~urlv
147 url_login = Login:: username:username password:(":" password) "@"
148 method = [+\-.a-z0-9]+
149 domain = (part +/ ".") -> ~"."
150 part = [a-zA-Z0-9\-]++
151 // interesting use of boolean grammars
152 // &~ ([\-0-9] ~[]* | ~[]* [\-0-9])
154 email = Email:: user:username "@" host:host -> ~[.]
156 host = IP:: nums "." nums "." nums "." nums
161 // Tokens ///////////////////////////////////////////////////////////////////
166 quoted = "\"" ((~[\"\\] | escaped)+) "\""
173 // Chars ///////////////////////////////////////////////////////////////
177 alphanum = [a-zA-Z0-9]
178 sym = ~[a-zA-Z0-9\ \r\n=\">]