1. <lexer>
    
  2.   <config>
    
  3.     <name>TASM</name>
    
  4.     <alias>tasm</alias>
    
  5.     <filename>*.asm</filename>
    
  6.     <filename>*.ASM</filename>
    
  7.     <filename>*.tasm</filename>
    
  8.     <mime_type>text/x-tasm</mime_type>
    
  9.     <case_insensitive>true</case_insensitive>
    
  10.   </config>
    
  11.   <rules>
    
  12.     <state name="preproc">
    
  13.       <rule pattern="[^;\n]+">
    
  14.         <token type="CommentPreproc"/>
    
  15.       </rule>
    
  16.       <rule pattern=";.*?\n">
    
  17.         <token type="CommentSingle"/>
    
  18.         <pop depth="1"/>
    
  19.       </rule>
    
  20.       <rule pattern="\n">
    
  21.         <token type="CommentPreproc"/>
    
  22.         <pop depth="1"/>
    
  23.       </rule>
    
  24.     </state>
    
  25.     <state name="whitespace">
    
  26.       <rule pattern="[\n\r]">
    
  27.         <token type="Text"/>
    
  28.       </rule>
    
  29.       <rule pattern="\\[\n\r]">
    
  30.         <token type="Text"/>
    
  31.       </rule>
    
  32.       <rule pattern="[ \t]+">
    
  33.         <token type="Text"/>
    
  34.       </rule>
    
  35.       <rule pattern=";.*">
    
  36.         <token type="CommentSingle"/>
    
  37.       </rule>
    
  38.     </state>
    
  39.     <state name="punctuation">
    
  40.       <rule pattern="[,():\[\]]+">
    
  41.         <token type="Punctuation"/>
    
  42.       </rule>
    
  43.       <rule pattern="[&amp;|^&lt;&gt;+*=/%~-]+">
    
  44.         <token type="Operator"/>
    
  45.       </rule>
    
  46.       <rule pattern="[$]+">
    
  47.         <token type="KeywordConstant"/>
    
  48.       </rule>
    
  49.       <rule pattern="seg|wrt|strict">
    
  50.         <token type="OperatorWord"/>
    
  51.       </rule>
    
  52.       <rule pattern="byte|[dq]?word">
    
  53.         <token type="KeywordType"/>
    
  54.       </rule>
    
  55.     </state>
    
  56.     <state name="root">
    
  57.       <rule pattern="^\s*%">
    
  58.         <token type="CommentPreproc"/>
    
  59.         <push state="preproc"/>
    
  60.       </rule>
    
  61.       <rule>
    
  62.         <include state="whitespace"/>
    
  63.       </rule>
    
  64.       <rule pattern="[@a-z$._?][\w$.?#@~]*:">
    
  65.         <token type="NameLabel"/>
    
  66.       </rule>
    
  67.       <rule pattern="BITS|USE16|USE32|SECTION|SEGMENT|ABSOLUTE|EXTERN|GLOBAL|ORG|ALIGN|STRUC|ENDSTRUC|ENDS|COMMON|CPU|GROUP|UPPERCASE|INCLUDE|EXPORT|LIBRARY|MODULE|PROC|ENDP|USES|ARG|DATASEG|UDATASEG|END|IDEAL|P386|MODEL|ASSUME|CODESEG|SIZE">
    
  68.         <token type="Keyword"/>
    
  69.         <push state="instruction-args"/>
    
  70.       </rule>
    
  71.       <rule pattern="([@a-z$._?][\w$.?#@~]*)(\s+)(db|dd|dw|T[A-Z][a-z]+)">
    
  72.         <bygroups>
    
  73.           <token type="NameConstant"/>
    
  74.           <token type="KeywordDeclaration"/>
    
  75.           <token type="KeywordDeclaration"/>
    
  76.         </bygroups>
    
  77.         <push state="instruction-args"/>
    
  78.       </rule>
    
  79.       <rule pattern="(?:res|d)[bwdqt]|times">
    
  80.         <token type="KeywordDeclaration"/>
    
  81.         <push state="instruction-args"/>
    
  82.       </rule>
    
  83.       <rule pattern="[@a-z$._?][\w$.?#@~]*">
    
  84.         <token type="NameFunction"/>
    
  85.         <push state="instruction-args"/>
    
  86.       </rule>
    
  87.       <rule pattern="[\r\n]+">
    
  88.         <token type="Text"/>
    
  89.       </rule>
    
  90.     </state>
    
  91.     <state name="instruction-args">
    
  92.       <rule pattern="&#34;(\\&#34;|[^&#34;\n])*&#34;|&#39;(\\&#39;|[^&#39;\n])*&#39;|`(\\`|[^`\n])*`">
    
  93.         <token type="LiteralString"/>
    
  94.       </rule>
    
  95.       <rule pattern="(?:0x[0-9a-f]+|$0[0-9a-f]*|[0-9]+[0-9a-f]*h)">
    
  96.         <token type="LiteralNumberHex"/>
    
  97.       </rule>
    
  98.       <rule pattern="[0-7]+q">
    
  99.         <token type="LiteralNumberOct"/>
    
  100.       </rule>
    
  101.       <rule pattern="[01]+b">
    
  102.         <token type="LiteralNumberBin"/>
    
  103.       </rule>
    
  104.       <rule pattern="[0-9]+\.e?[0-9]+">
    
  105.         <token type="LiteralNumberFloat"/>
    
  106.       </rule>
    
  107.       <rule pattern="[0-9]+">
    
  108.         <token type="LiteralNumberInteger"/>
    
  109.       </rule>
    
  110.       <rule>
    
  111.         <include state="punctuation"/>
    
  112.       </rule>
    
  113.       <rule pattern="r[0-9][0-5]?[bwd]|[a-d][lh]|[er]?[a-d]x|[er]?[sb]p|[er]?[sd]i|[c-gs]s|st[0-7]|mm[0-7]|cr[0-4]|dr[0-367]|tr[3-7]">
    
  114.         <token type="NameBuiltin"/>
    
  115.       </rule>
    
  116.       <rule pattern="[@a-z$._?][\w$.?#@~]*">
    
  117.         <token type="NameVariable"/>
    
  118.       </rule>
    
  119.       <rule pattern="(\\\s*)(;.*)([\r\n])">
    
  120.         <bygroups>
    
  121.           <token type="Text"/>
    
  122.           <token type="CommentSingle"/>
    
  123.           <token type="Text"/>
    
  124.         </bygroups>
    
  125.       </rule>
    
  126.       <rule pattern="[\r\n]+">
    
  127.         <token type="Text"/>
    
  128.         <pop depth="1"/>
    
  129.       </rule>
    
  130.       <rule>
    
  131.         <include state="whitespace"/>
    
  132.       </rule>
    
  133.     </state>
    
  134.   </rules>
    
  135. </lexer>