prql.xml

  1<lexer>
  2  <config>
  3    <name>PRQL</name>
  4    <alias>prql</alias>
  5    <filename>*.prql</filename>
  6    <mime_type>application/prql</mime_type>
  7  </config>
  8  <rules>
  9    <state name="root">
 10      <rule pattern="#!.*"><token type="LiteralStringDoc"/></rule>
 11      <rule pattern="#.*"><token type="CommentSingle"/></rule>
 12      <rule pattern="\s+"><token type="TextWhitespace"/></rule>
 13      <rule pattern="^(\s*)(module)(\s*)"><bygroups><token type="TextWhitespace"/><token type="KeywordNamespace"/><token type="TextWhitespace"/></bygroups><push state="imports"/></rule>
 14      <rule pattern="(bool|int|int8|int16|int32|int64|int128|float|text|set)\b"><token type="KeywordType"/></rule>
 15      <rule pattern="^prql "><token type="KeywordReserved"/></rule>
 16      <rule pattern="let"><token type="KeywordDeclaration"/></rule>
 17      <rule><include state="keywords"/></rule>
 18      <rule><include state="expr"/></rule>
 19      <rule pattern="^[A-Za-z_][a-zA-Z0-9_]*"><token type="Keyword"/></rule>
 20    </state>
 21    <state name="expr">
 22      <rule pattern="(f)(&quot;&quot;&quot;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringDouble"/></bygroups><combined state="fstringescape" state="tdqf"/></rule>
 23      <rule pattern="(f)(&#x27;&#x27;&#x27;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringSingle"/></bygroups><combined state="fstringescape" state="tsqf"/></rule>
 24      <rule pattern="(f)(&quot;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringDouble"/></bygroups><combined state="fstringescape" state="dqf"/></rule>
 25      <rule pattern="(f)(&#x27;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringSingle"/></bygroups><combined state="fstringescape" state="sqf"/></rule>
 26      <rule pattern="(s)(&quot;&quot;&quot;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringDouble"/></bygroups><combined state="stringescape" state="tdqf"/></rule>
 27      <rule pattern="(s)(&#x27;&#x27;&#x27;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringSingle"/></bygroups><combined state="stringescape" state="tsqf"/></rule>
 28      <rule pattern="(s)(&quot;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringDouble"/></bygroups><combined state="stringescape" state="dqf"/></rule>
 29      <rule pattern="(s)(&#x27;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringSingle"/></bygroups><combined state="stringescape" state="sqf"/></rule>
 30      <rule pattern="(?i)(r)(&quot;&quot;&quot;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringDouble"/></bygroups><push state="tdqs"/></rule>
 31      <rule pattern="(?i)(r)(&#x27;&#x27;&#x27;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringSingle"/></bygroups><push state="tsqs"/></rule>
 32      <rule pattern="(?i)(r)(&quot;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringDouble"/></bygroups><push state="dqs"/></rule>
 33      <rule pattern="(?i)(r)(&#x27;)"><bygroups><token type="LiteralStringAffix"/><token type="LiteralStringSingle"/></bygroups><push state="sqs"/></rule>
 34      <rule pattern="&quot;&quot;&quot;"><token type="LiteralStringDouble"/><combined state="stringescape" state="tdqs"/></rule>
 35      <rule pattern="&#x27;&#x27;&#x27;"><token type="LiteralStringSingle"/><combined state="stringescape" state="tsqs"/></rule>
 36      <rule pattern="&quot;"><token type="LiteralStringDouble"/><combined state="stringescape" state="dqs"/></rule>
 37      <rule pattern="&#x27;"><token type="LiteralStringSingle"/><combined state="stringescape" state="sqs"/></rule>
 38      <rule pattern="@\d{4}-\d{2}-\d{2}T\d{2}(:\d{2})?(:\d{2})?(\.\d{1,6})?(Z|[+-]\d{1,2}(:\d{1,2})?)?"><token type="LiteralDate"/></rule>
 39      <rule pattern="@\d{4}-\d{2}-\d{2}"><token type="LiteralDate"/></rule>
 40      <rule pattern="@\d{2}(:\d{2})?(:\d{2})?(\.\d{1,6})?(Z|[+-]\d{1,2}(:\d{1,2})?)?"><token type="LiteralDate"/></rule>
 41      <rule pattern="[^\S\n]+"><token type="Text"/></rule>
 42      <rule><include state="numbers"/></rule>
 43      <rule pattern="-&gt;|=&gt;|==|!=|&gt;=|&lt;=|~=|&amp;&amp;|\|\||\?\?|\/\/"><token type="Operator"/></rule>
 44      <rule pattern="[-~+/*%=&lt;&gt;&amp;^|.@]"><token type="Operator"/></rule>
 45      <rule pattern="[]{}:(),;[]"><token type="Punctuation"/></rule>
 46      <rule><include state="functions"/></rule>
 47      <rule pattern="[A-Za-z_][a-zA-Z0-9_]*"><token type="NameVariable"/></rule>
 48    </state>
 49    <state name="numbers">
 50      <rule pattern="(\d(?:_?\d)*\.(?:\d(?:_?\d)*)?|(?:\d(?:_?\d)*)?\.\d(?:_?\d)*)([eE][+-]?\d(?:_?\d)*)?"><token type="LiteralNumberFloat"/></rule>
 51      <rule pattern="\d(?:_?\d)*[eE][+-]?\d(?:_?\d)*j?"><token type="LiteralNumberFloat"/></rule>
 52      <rule pattern="0[oO](?:_?[0-7])+"><token type="LiteralNumberOct"/></rule>
 53      <rule pattern="0[bB](?:_?[01])+"><token type="LiteralNumberBin"/></rule>
 54      <rule pattern="0[xX](?:_?[a-fA-F0-9])+"><token type="LiteralNumberHex"/></rule>
 55      <rule pattern="\d(?:_?\d)*"><token type="LiteralNumberInteger"/></rule>
 56    </state>
 57    <state name="fstringescape">
 58      <rule><include state="stringescape"/></rule>
 59    </state>
 60    <state name="bytesescape">
 61      <rule pattern="\\([\\bfnrt&quot;\&#x27;]|\n|x[a-fA-F0-9]{2}|[0-7]{1,3})"><token type="LiteralStringEscape"/></rule>
 62    </state>
 63    <state name="stringescape">
 64      <rule pattern="\\(N\{.*?\}|u\{[a-fA-F0-9]{1,6}\})"><token type="LiteralStringEscape"/></rule>
 65      <rule><include state="bytesescape"/></rule>
 66    </state>
 67    <state name="fstrings-single">
 68      <rule pattern="\}"><token type="LiteralStringInterpol"/></rule>
 69      <rule pattern="\{"><token type="LiteralStringInterpol"/><push state="expr-inside-fstring"/></rule>
 70      <rule pattern="[^\\\&#x27;&quot;{}\n]+"><token type="LiteralStringSingle"/></rule>
 71      <rule pattern="[\&#x27;&quot;\\]"><token type="LiteralStringSingle"/></rule>
 72    </state>
 73    <state name="fstrings-double">
 74      <rule pattern="\}"><token type="LiteralStringInterpol"/></rule>
 75      <rule pattern="\{"><token type="LiteralStringInterpol"/><push state="expr-inside-fstring"/></rule>
 76      <rule pattern="[^\\\&#x27;&quot;{}\n]+"><token type="LiteralStringDouble"/></rule>
 77      <rule pattern="[\&#x27;&quot;\\]"><token type="LiteralStringDouble"/></rule>
 78    </state>
 79    <state name="strings-single">
 80      <rule pattern="\{((\w+)((\.\w+)|(\[[^\]]+\]))*)?(\:(.?[&lt;&gt;=\^])?[-+ ]?#?0?(\d+)?,?(\.\d+)?[E-GXb-gnosx%]?)?\}"><token type="LiteralStringInterpol"/></rule>
 81      <rule pattern="[^\\\&#x27;&quot;%{\n]+"><token type="LiteralStringSingle"/></rule>
 82      <rule pattern="[\&#x27;&quot;\\]"><token type="LiteralStringSingle"/></rule>
 83      <rule pattern="%|(\{{1,2})"><token type="LiteralStringSingle"/></rule>
 84    </state>
 85    <state name="strings-double">
 86      <rule pattern="\{((\w+)((\.\w+)|(\[[^\]]+\]))*)?(\:(.?[&lt;&gt;=\^])?[-+ ]?#?0?(\d+)?,?(\.\d+)?[E-GXb-gnosx%]?)?\}"><token type="LiteralStringInterpol"/></rule>
 87      <rule pattern="[^\\\&#x27;&quot;%{\n]+"><token type="LiteralStringDouble"/></rule>
 88      <rule pattern="[\&#x27;&quot;\\]"><token type="LiteralStringDouble"/></rule>
 89      <rule pattern="%|(\{{1,2})"><token type="LiteralStringDouble"/></rule>
 90    </state>
 91    <state name="dqf">
 92      <rule pattern="&quot;"><token type="LiteralStringDouble"/><pop depth="1"/></rule>
 93      <rule pattern="\\\\|\\&quot;|\\\n"><token type="LiteralStringEscape"/></rule>
 94      <rule><include state="fstrings-double"/></rule>
 95    </state>
 96    <state name="sqf">
 97      <rule pattern="&#x27;"><token type="LiteralStringSingle"/><pop depth="1"/></rule>
 98      <rule pattern="\\\\|\\&#x27;|\\\n"><token type="LiteralStringEscape"/></rule>
 99      <rule><include state="fstrings-single"/></rule>
100    </state>
101    <state name="dqs">
102      <rule pattern="&quot;"><token type="LiteralStringDouble"/><pop depth="1"/></rule>
103      <rule pattern="\\\\|\\&quot;|\\\n"><token type="LiteralStringEscape"/></rule>
104      <rule><include state="strings-double"/></rule>
105    </state>
106    <state name="sqs">
107      <rule pattern="&#x27;"><token type="LiteralStringSingle"/><pop depth="1"/></rule>
108      <rule pattern="\\\\|\\&#x27;|\\\n"><token type="LiteralStringEscape"/></rule>
109      <rule><include state="strings-single"/></rule>
110    </state>
111    <state name="tdqf">
112      <rule pattern="&quot;&quot;&quot;"><token type="LiteralStringDouble"/><pop depth="1"/></rule>
113      <rule><include state="fstrings-double"/></rule>
114      <rule pattern="\n"><token type="LiteralStringDouble"/></rule>
115    </state>
116    <state name="tsqf">
117      <rule pattern="&#x27;&#x27;&#x27;"><token type="LiteralStringSingle"/><pop depth="1"/></rule>
118      <rule><include state="fstrings-single"/></rule>
119      <rule pattern="\n"><token type="LiteralStringSingle"/></rule>
120    </state>
121    <state name="tdqs">
122      <rule pattern="&quot;&quot;&quot;"><token type="LiteralStringDouble"/><pop depth="1"/></rule>
123      <rule><include state="strings-double"/></rule>
124      <rule pattern="\n"><token type="LiteralStringDouble"/></rule>
125    </state>
126    <state name="tsqs">
127      <rule pattern="&#x27;&#x27;&#x27;"><token type="LiteralStringSingle"/><pop depth="1"/></rule>
128      <rule><include state="strings-single"/></rule>
129      <rule pattern="\n"><token type="LiteralStringSingle"/></rule>
130    </state>
131    <state name="expr-inside-fstring">
132      <rule pattern="[{([]"><token type="Punctuation"/><push state="expr-inside-fstring-inner"/></rule>
133      <rule pattern="(=\s*)?\}"><token type="LiteralStringInterpol"/><pop depth="1"/></rule>
134      <rule pattern="(=\s*)?:"><token type="LiteralStringInterpol"/><pop depth="1"/></rule>
135      <rule pattern="\s+"><token type="TextWhitespace"/></rule>
136      <rule><include state="expr"/></rule>
137    </state>
138    <state name="expr-inside-fstring-inner">
139      <rule pattern="[{([]"><token type="Punctuation"/><push state="expr-inside-fstring-inner"/></rule>
140      <rule pattern="[])}]"><token type="Punctuation"/><pop depth="1"/></rule>
141      <rule pattern="\s+"><token type="TextWhitespace"/></rule>
142      <rule><include state="expr"/></rule>
143    </state>
144    <state name="keywords">
145      <rule pattern="(into|case|type|module|internal)\b"><token type="Keyword"/></rule>
146      <rule pattern="(true|false|null)\b"><token type="KeywordConstant"/></rule>
147    </state>
148    <state name="functions">
149      <rule pattern="(min|max|sum|average|stddev|every|any|concat_array|count|lag|lead|first|last|rank|rank_dense|row_number|round|as|in|tuple_every|tuple_map|tuple_zip|_eq|_is_null|from_text|lower|upper|read_parquet|read_csv)\b"><token type="NameFunction"/></rule>
150    </state>
151    <state name="comment">
152      <rule pattern="-(?!\})"><token type="CommentMultiline"/></rule>
153      <rule pattern="\{-"><token type="CommentMultiline"/><push state="comment"/></rule>
154      <rule pattern="[^-}]"><token type="CommentMultiline"/></rule>
155      <rule pattern="-\}"><token type="CommentMultiline"/><pop depth="1"/></rule>
156    </state>
157    <state name="imports">
158      <rule pattern="\w+(\.\w+)*"><token type="NameClass"/><pop depth="1"/></rule>
159    </state>
160  </rules>
161</lexer>