hdl.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382
  1. # -*- coding: utf-8 -*-
  2. """
  3. pygments.lexers.hdl
  4. ~~~~~~~~~~~~~~~~~~~
  5. Lexers for hardware descriptor languages.
  6. :copyright: Copyright 2006-2017 by the Pygments team, see AUTHORS.
  7. :license: BSD, see LICENSE for details.
  8. """
  9. import re
  10. from pygments.lexer import RegexLexer, bygroups, include, using, this, words
  11. from pygments.token import Text, Comment, Operator, Keyword, Name, String, \
  12. Number, Punctuation, Error
  13. __all__ = ['VerilogLexer', 'SystemVerilogLexer', 'VhdlLexer']
  14. class VerilogLexer(RegexLexer):
  15. """
  16. For verilog source code with preprocessor directives.
  17. .. versionadded:: 1.4
  18. """
  19. name = 'verilog'
  20. aliases = ['verilog', 'v']
  21. filenames = ['*.v']
  22. mimetypes = ['text/x-verilog']
  23. #: optional Comment or Whitespace
  24. _ws = r'(?:\s|//.*?\n|/[*].*?[*]/)+'
  25. tokens = {
  26. 'root': [
  27. (r'^\s*`define', Comment.Preproc, 'macro'),
  28. (r'\n', Text),
  29. (r'\s+', Text),
  30. (r'\\\n', Text), # line continuation
  31. (r'/(\\\n)?/(\n|(.|\n)*?[^\\]\n)', Comment.Single),
  32. (r'/(\\\n)?[*](.|\n)*?[*](\\\n)?/', Comment.Multiline),
  33. (r'[{}#@]', Punctuation),
  34. (r'L?"', String, 'string'),
  35. (r"L?'(\\.|\\[0-7]{1,3}|\\x[a-fA-F0-9]{1,2}|[^\\\'\n])'", String.Char),
  36. (r'(\d+\.\d*|\.\d+|\d+)[eE][+-]?\d+[lL]?', Number.Float),
  37. (r'(\d+\.\d*|\.\d+|\d+[fF])[fF]?', Number.Float),
  38. (r'([0-9]+)|(\'h)[0-9a-fA-F]+', Number.Hex),
  39. (r'([0-9]+)|(\'b)[01]+', Number.Bin),
  40. (r'([0-9]+)|(\'d)[0-9]+', Number.Integer),
  41. (r'([0-9]+)|(\'o)[0-7]+', Number.Oct),
  42. (r'\'[01xz]', Number),
  43. (r'\d+[Ll]?', Number.Integer),
  44. (r'\*/', Error),
  45. (r'[~!%^&*+=|?:<>/-]', Operator),
  46. (r'[()\[\],.;\']', Punctuation),
  47. (r'`[a-zA-Z_]\w*', Name.Constant),
  48. (r'^(\s*)(package)(\s+)', bygroups(Text, Keyword.Namespace, Text)),
  49. (r'^(\s*)(import)(\s+)', bygroups(Text, Keyword.Namespace, Text),
  50. 'import'),
  51. (words((
  52. 'always', 'always_comb', 'always_ff', 'always_latch', 'and',
  53. 'assign', 'automatic', 'begin', 'break', 'buf', 'bufif0', 'bufif1',
  54. 'case', 'casex', 'casez', 'cmos', 'const', 'continue', 'deassign',
  55. 'default', 'defparam', 'disable', 'do', 'edge', 'else', 'end', 'endcase',
  56. 'endfunction', 'endgenerate', 'endmodule', 'endpackage', 'endprimitive',
  57. 'endspecify', 'endtable', 'endtask', 'enum', 'event', 'final', 'for',
  58. 'force', 'forever', 'fork', 'function', 'generate', 'genvar', 'highz0',
  59. 'highz1', 'if', 'initial', 'inout', 'input', 'integer', 'join', 'large',
  60. 'localparam', 'macromodule', 'medium', 'module', 'nand', 'negedge',
  61. 'nmos', 'nor', 'not', 'notif0', 'notif1', 'or', 'output', 'packed',
  62. 'parameter', 'pmos', 'posedge', 'primitive', 'pull0', 'pull1',
  63. 'pulldown', 'pullup', 'rcmos', 'ref', 'release', 'repeat', 'return',
  64. 'rnmos', 'rpmos', 'rtran', 'rtranif0', 'rtranif1', 'scalared', 'signed',
  65. 'small', 'specify', 'specparam', 'strength', 'string', 'strong0',
  66. 'strong1', 'struct', 'table', 'task', 'tran', 'tranif0', 'tranif1',
  67. 'type', 'typedef', 'unsigned', 'var', 'vectored', 'void', 'wait',
  68. 'weak0', 'weak1', 'while', 'xnor', 'xor'), suffix=r'\b'),
  69. Keyword),
  70. (words((
  71. 'accelerate', 'autoexpand_vectornets', 'celldefine', 'default_nettype',
  72. 'else', 'elsif', 'endcelldefine', 'endif', 'endprotect', 'endprotected',
  73. 'expand_vectornets', 'ifdef', 'ifndef', 'include', 'noaccelerate',
  74. 'noexpand_vectornets', 'noremove_gatenames', 'noremove_netnames',
  75. 'nounconnected_drive', 'protect', 'protected', 'remove_gatenames',
  76. 'remove_netnames', 'resetall', 'timescale', 'unconnected_drive',
  77. 'undef'), prefix=r'`', suffix=r'\b'),
  78. Comment.Preproc),
  79. (words((
  80. 'bits', 'bitstoreal', 'bitstoshortreal', 'countdrivers', 'display', 'fclose',
  81. 'fdisplay', 'finish', 'floor', 'fmonitor', 'fopen', 'fstrobe', 'fwrite',
  82. 'getpattern', 'history', 'incsave', 'input', 'itor', 'key', 'list', 'log',
  83. 'monitor', 'monitoroff', 'monitoron', 'nokey', 'nolog', 'printtimescale',
  84. 'random', 'readmemb', 'readmemh', 'realtime', 'realtobits', 'reset',
  85. 'reset_count', 'reset_value', 'restart', 'rtoi', 'save', 'scale', 'scope',
  86. 'shortrealtobits', 'showscopes', 'showvariables', 'showvars', 'sreadmemb',
  87. 'sreadmemh', 'stime', 'stop', 'strobe', 'time', 'timeformat', 'write'),
  88. prefix=r'\$', suffix=r'\b'),
  89. Name.Builtin),
  90. (words((
  91. 'byte', 'shortint', 'int', 'longint', 'integer', 'time',
  92. 'bit', 'logic', 'reg', 'supply0', 'supply1', 'tri', 'triand',
  93. 'trior', 'tri0', 'tri1', 'trireg', 'uwire', 'wire', 'wand', 'wo'
  94. 'shortreal', 'real', 'realtime'), suffix=r'\b'),
  95. Keyword.Type),
  96. (r'[a-zA-Z_]\w*:(?!:)', Name.Label),
  97. (r'\$?[a-zA-Z_]\w*', Name),
  98. ],
  99. 'string': [
  100. (r'"', String, '#pop'),
  101. (r'\\([\\abfnrtv"\']|x[a-fA-F0-9]{2,4}|[0-7]{1,3})', String.Escape),
  102. (r'[^\\"\n]+', String), # all other characters
  103. (r'\\\n', String), # line continuation
  104. (r'\\', String), # stray backslash
  105. ],
  106. 'macro': [
  107. (r'[^/\n]+', Comment.Preproc),
  108. (r'/[*](.|\n)*?[*]/', Comment.Multiline),
  109. (r'//.*?\n', Comment.Single, '#pop'),
  110. (r'/', Comment.Preproc),
  111. (r'(?<=\\)\n', Comment.Preproc),
  112. (r'\n', Comment.Preproc, '#pop'),
  113. ],
  114. 'import': [
  115. (r'[\w:]+\*?', Name.Namespace, '#pop')
  116. ]
  117. }
  118. def get_tokens_unprocessed(self, text):
  119. for index, token, value in \
  120. RegexLexer.get_tokens_unprocessed(self, text):
  121. # Convention: mark all upper case names as constants
  122. if token is Name:
  123. if value.isupper():
  124. token = Name.Constant
  125. yield index, token, value
  126. class SystemVerilogLexer(RegexLexer):
  127. """
  128. Extends verilog lexer to recognise all SystemVerilog keywords from IEEE
  129. 1800-2009 standard.
  130. .. versionadded:: 1.5
  131. """
  132. name = 'systemverilog'
  133. aliases = ['systemverilog', 'sv']
  134. filenames = ['*.sv', '*.svh']
  135. mimetypes = ['text/x-systemverilog']
  136. #: optional Comment or Whitespace
  137. _ws = r'(?:\s|//.*?\n|/[*].*?[*]/)+'
  138. tokens = {
  139. 'root': [
  140. (r'^\s*`define', Comment.Preproc, 'macro'),
  141. (r'^(\s*)(package)(\s+)', bygroups(Text, Keyword.Namespace, Text)),
  142. (r'^(\s*)(import)(\s+)', bygroups(Text, Keyword.Namespace, Text), 'import'),
  143. (r'\n', Text),
  144. (r'\s+', Text),
  145. (r'\\\n', Text), # line continuation
  146. (r'/(\\\n)?/(\n|(.|\n)*?[^\\]\n)', Comment.Single),
  147. (r'/(\\\n)?[*](.|\n)*?[*](\\\n)?/', Comment.Multiline),
  148. (r'[{}#@]', Punctuation),
  149. (r'L?"', String, 'string'),
  150. (r"L?'(\\.|\\[0-7]{1,3}|\\x[a-fA-F0-9]{1,2}|[^\\\'\n])'", String.Char),
  151. (r'(\d+\.\d*|\.\d+|\d+)[eE][+-]?\d+[lL]?', Number.Float),
  152. (r'(\d+\.\d*|\.\d+|\d+[fF])[fF]?', Number.Float),
  153. (r'([0-9]+)|(\'h)[0-9a-fA-F]+', Number.Hex),
  154. (r'([0-9]+)|(\'b)[01]+', Number.Bin),
  155. (r'([0-9]+)|(\'d)[0-9]+', Number.Integer),
  156. (r'([0-9]+)|(\'o)[0-7]+', Number.Oct),
  157. (r'\'[01xz]', Number),
  158. (r'\d+[Ll]?', Number.Integer),
  159. (r'\*/', Error),
  160. (r'[~!%^&*+=|?:<>/-]', Operator),
  161. (r'[()\[\],.;\']', Punctuation),
  162. (r'`[a-zA-Z_]\w*', Name.Constant),
  163. (words((
  164. 'accept_on', 'alias', 'always', 'always_comb', 'always_ff', 'always_latch',
  165. 'and', 'assert', 'assign', 'assume', 'automatic', 'before', 'begin', 'bind', 'bins',
  166. 'binsof', 'bit', 'break', 'buf', 'bufif0', 'bufif1', 'byte', 'case', 'casex', 'casez',
  167. 'cell', 'chandle', 'checker', 'class', 'clocking', 'cmos', 'config', 'const', 'constraint',
  168. 'context', 'continue', 'cover', 'covergroup', 'coverpoint', 'cross', 'deassign',
  169. 'default', 'defparam', 'design', 'disable', 'dist', 'do', 'edge', 'else', 'end', 'endcase',
  170. 'endchecker', 'endclass', 'endclocking', 'endconfig', 'endfunction', 'endgenerate',
  171. 'endgroup', 'endinterface', 'endmodule', 'endpackage', 'endprimitive',
  172. 'endprogram', 'endproperty', 'endsequence', 'endspecify', 'endtable',
  173. 'endtask', 'enum', 'event', 'eventually', 'expect', 'export', 'extends', 'extern',
  174. 'final', 'first_match', 'for', 'force', 'foreach', 'forever', 'fork', 'forkjoin',
  175. 'function', 'generate', 'genvar', 'global', 'highz0', 'highz1', 'if', 'iff', 'ifnone',
  176. 'ignore_bins', 'illegal_bins', 'implies', 'import', 'incdir', 'include',
  177. 'initial', 'inout', 'input', 'inside', 'instance', 'int', 'integer', 'interface',
  178. 'intersect', 'join', 'join_any', 'join_none', 'large', 'let', 'liblist', 'library',
  179. 'local', 'localparam', 'logic', 'longint', 'macromodule', 'matches', 'medium',
  180. 'modport', 'module', 'nand', 'negedge', 'new', 'nexttime', 'nmos', 'nor', 'noshowcancelled',
  181. 'not', 'notif0', 'notif1', 'null', 'or', 'output', 'package', 'packed', 'parameter',
  182. 'pmos', 'posedge', 'primitive', 'priority', 'program', 'property', 'protected',
  183. 'pull0', 'pull1', 'pulldown', 'pullup', 'pulsestyle_ondetect', 'pulsestyle_onevent',
  184. 'pure', 'rand', 'randc', 'randcase', 'randsequence', 'rcmos', 'real', 'realtime',
  185. 'ref', 'reg', 'reject_on', 'release', 'repeat', 'restrict', 'return', 'rnmos',
  186. 'rpmos', 'rtran', 'rtranif0', 'rtranif1', 's_always', 's_eventually', 's_nexttime',
  187. 's_until', 's_until_with', 'scalared', 'sequence', 'shortint', 'shortreal',
  188. 'showcancelled', 'signed', 'small', 'solve', 'specify', 'specparam', 'static',
  189. 'string', 'strong', 'strong0', 'strong1', 'struct', 'super', 'supply0', 'supply1',
  190. 'sync_accept_on', 'sync_reject_on', 'table', 'tagged', 'task', 'this', 'throughout',
  191. 'time', 'timeprecision', 'timeunit', 'tran', 'tranif0', 'tranif1', 'tri', 'tri0',
  192. 'tri1', 'triand', 'trior', 'trireg', 'type', 'typedef', 'union', 'unique', 'unique0',
  193. 'unsigned', 'until', 'until_with', 'untyped', 'use', 'uwire', 'var', 'vectored',
  194. 'virtual', 'void', 'wait', 'wait_order', 'wand', 'weak', 'weak0', 'weak1', 'while',
  195. 'wildcard', 'wire', 'with', 'within', 'wor', 'xnor', 'xor'), suffix=r'\b'),
  196. Keyword),
  197. (words((
  198. '`__FILE__', '`__LINE__', '`begin_keywords', '`celldefine', '`default_nettype',
  199. '`define', '`else', '`elsif', '`end_keywords', '`endcelldefine', '`endif',
  200. '`ifdef', '`ifndef', '`include', '`line', '`nounconnected_drive', '`pragma',
  201. '`resetall', '`timescale', '`unconnected_drive', '`undef', '`undefineall'),
  202. suffix=r'\b'),
  203. Comment.Preproc),
  204. (words((
  205. '$display', '$displayb', '$displayh', '$displayo', '$dumpall', '$dumpfile',
  206. '$dumpflush', '$dumplimit', '$dumpoff', '$dumpon', '$dumpports',
  207. '$dumpportsall', '$dumpportsflush', '$dumpportslimit', '$dumpportsoff',
  208. '$dumpportson', '$dumpvars', '$fclose', '$fdisplay', '$fdisplayb',
  209. '$fdisplayh', '$fdisplayo', '$feof', '$ferror', '$fflush', '$fgetc',
  210. '$fgets', '$finish', '$fmonitor', '$fmonitorb', '$fmonitorh', '$fmonitoro',
  211. '$fopen', '$fread', '$fscanf', '$fseek', '$fstrobe', '$fstrobeb', '$fstrobeh',
  212. '$fstrobeo', '$ftell', '$fwrite', '$fwriteb', '$fwriteh', '$fwriteo',
  213. '$monitor', '$monitorb', '$monitorh', '$monitoro', '$monitoroff',
  214. '$monitoron', '$plusargs', '$random', '$readmemb', '$readmemh', '$rewind',
  215. '$sformat', '$sformatf', '$sscanf', '$strobe', '$strobeb', '$strobeh', '$strobeo',
  216. '$swrite', '$swriteb', '$swriteh', '$swriteo', '$test', '$ungetc',
  217. '$value$plusargs', '$write', '$writeb', '$writeh', '$writememb',
  218. '$writememh', '$writeo'), suffix=r'\b'),
  219. Name.Builtin),
  220. (r'(class)(\s+)', bygroups(Keyword, Text), 'classname'),
  221. (words((
  222. 'byte', 'shortint', 'int', 'longint', 'integer', 'time',
  223. 'bit', 'logic', 'reg', 'supply0', 'supply1', 'tri', 'triand',
  224. 'trior', 'tri0', 'tri1', 'trireg', 'uwire', 'wire', 'wand', 'wo'
  225. 'shortreal', 'real', 'realtime'), suffix=r'\b'),
  226. Keyword.Type),
  227. (r'[a-zA-Z_]\w*:(?!:)', Name.Label),
  228. (r'\$?[a-zA-Z_]\w*', Name),
  229. ],
  230. 'classname': [
  231. (r'[a-zA-Z_]\w*', Name.Class, '#pop'),
  232. ],
  233. 'string': [
  234. (r'"', String, '#pop'),
  235. (r'\\([\\abfnrtv"\']|x[a-fA-F0-9]{2,4}|[0-7]{1,3})', String.Escape),
  236. (r'[^\\"\n]+', String), # all other characters
  237. (r'\\\n', String), # line continuation
  238. (r'\\', String), # stray backslash
  239. ],
  240. 'macro': [
  241. (r'[^/\n]+', Comment.Preproc),
  242. (r'/[*](.|\n)*?[*]/', Comment.Multiline),
  243. (r'//.*?\n', Comment.Single, '#pop'),
  244. (r'/', Comment.Preproc),
  245. (r'(?<=\\)\n', Comment.Preproc),
  246. (r'\n', Comment.Preproc, '#pop'),
  247. ],
  248. 'import': [
  249. (r'[\w:]+\*?', Name.Namespace, '#pop')
  250. ]
  251. }
  252. def get_tokens_unprocessed(self, text):
  253. for index, token, value in \
  254. RegexLexer.get_tokens_unprocessed(self, text):
  255. # Convention: mark all upper case names as constants
  256. if token is Name:
  257. if value.isupper():
  258. token = Name.Constant
  259. yield index, token, value
  260. class VhdlLexer(RegexLexer):
  261. """
  262. For VHDL source code.
  263. .. versionadded:: 1.5
  264. """
  265. name = 'vhdl'
  266. aliases = ['vhdl']
  267. filenames = ['*.vhdl', '*.vhd']
  268. mimetypes = ['text/x-vhdl']
  269. flags = re.MULTILINE | re.IGNORECASE
  270. tokens = {
  271. 'root': [
  272. (r'\n', Text),
  273. (r'\s+', Text),
  274. (r'\\\n', Text), # line continuation
  275. (r'--.*?$', Comment.Single),
  276. (r"'(U|X|0|1|Z|W|L|H|-)'", String.Char),
  277. (r'[~!%^&*+=|?:<>/-]', Operator),
  278. (r"'[a-z_]\w*", Name.Attribute),
  279. (r'[()\[\],.;\']', Punctuation),
  280. (r'"[^\n\\"]*"', String),
  281. (r'(library)(\s+)([a-z_]\w*)',
  282. bygroups(Keyword, Text, Name.Namespace)),
  283. (r'(use)(\s+)(entity)', bygroups(Keyword, Text, Keyword)),
  284. (r'(use)(\s+)([a-z_][\w.]*\.)(all)',
  285. bygroups(Keyword, Text, Name.Namespace, Keyword)),
  286. (r'(use)(\s+)([a-z_][\w.]*)',
  287. bygroups(Keyword, Text, Name.Namespace)),
  288. (r'(std|ieee)(\.[a-z_]\w*)',
  289. bygroups(Name.Namespace, Name.Namespace)),
  290. (words(('std', 'ieee', 'work'), suffix=r'\b'),
  291. Name.Namespace),
  292. (r'(entity|component)(\s+)([a-z_]\w*)',
  293. bygroups(Keyword, Text, Name.Class)),
  294. (r'(architecture|configuration)(\s+)([a-z_]\w*)(\s+)'
  295. r'(of)(\s+)([a-z_]\w*)(\s+)(is)',
  296. bygroups(Keyword, Text, Name.Class, Text, Keyword, Text,
  297. Name.Class, Text, Keyword)),
  298. (r'([a-z_]\w*)(:)(\s+)(process|for)',
  299. bygroups(Name.Class, Operator, Text, Keyword)),
  300. (r'(end)(\s+)', bygroups(using(this), Text), 'endblock'),
  301. include('types'),
  302. include('keywords'),
  303. include('numbers'),
  304. (r'[a-z_]\w*', Name),
  305. ],
  306. 'endblock': [
  307. include('keywords'),
  308. (r'[a-z_]\w*', Name.Class),
  309. (r'(\s+)', Text),
  310. (r';', Punctuation, '#pop'),
  311. ],
  312. 'types': [
  313. (words((
  314. 'boolean', 'bit', 'character', 'severity_level', 'integer', 'time',
  315. 'delay_length', 'natural', 'positive', 'string', 'bit_vector',
  316. 'file_open_kind', 'file_open_status', 'std_ulogic', 'std_ulogic_vector',
  317. 'std_logic', 'std_logic_vector', 'signed', 'unsigned'), suffix=r'\b'),
  318. Keyword.Type),
  319. ],
  320. 'keywords': [
  321. (words((
  322. 'abs', 'access', 'after', 'alias', 'all', 'and',
  323. 'architecture', 'array', 'assert', 'attribute', 'begin', 'block',
  324. 'body', 'buffer', 'bus', 'case', 'component', 'configuration',
  325. 'constant', 'disconnect', 'downto', 'else', 'elsif', 'end',
  326. 'entity', 'exit', 'file', 'for', 'function', 'generate',
  327. 'generic', 'group', 'guarded', 'if', 'impure', 'in',
  328. 'inertial', 'inout', 'is', 'label', 'library', 'linkage',
  329. 'literal', 'loop', 'map', 'mod', 'nand', 'new',
  330. 'next', 'nor', 'not', 'null', 'of', 'on',
  331. 'open', 'or', 'others', 'out', 'package', 'port',
  332. 'postponed', 'procedure', 'process', 'pure', 'range', 'record',
  333. 'register', 'reject', 'rem', 'return', 'rol', 'ror', 'select',
  334. 'severity', 'signal', 'shared', 'sla', 'sll', 'sra',
  335. 'srl', 'subtype', 'then', 'to', 'transport', 'type',
  336. 'units', 'until', 'use', 'variable', 'wait', 'when',
  337. 'while', 'with', 'xnor', 'xor'), suffix=r'\b'),
  338. Keyword),
  339. ],
  340. 'numbers': [
  341. (r'\d{1,2}#[0-9a-f_]+#?', Number.Integer),
  342. (r'\d+', Number.Integer),
  343. (r'(\d+\.\d*|\.\d+|\d+)E[+-]?\d+', Number.Float),
  344. (r'X"[0-9a-f_]+"', Number.Hex),
  345. (r'O"[0-7_]+"', Number.Oct),
  346. (r'B"[01_]+"', Number.Bin),
  347. ],
  348. }