180 lines
7.0 KiB
Python
180 lines
7.0 KiB
Python
"""
|
|
pygments.lexers.forth
|
|
~~~~~~~~~~~~~~~~~~~~~
|
|
|
|
Lexer for the Forth language.
|
|
|
|
:copyright: Copyright 2006-2022 by the Pygments team, see AUTHORS.
|
|
:license: BSD, see LICENSE for details.
|
|
"""
|
|
|
|
import re
|
|
|
|
from pygments.lexer import RegexLexer, bygroups
|
|
from pygments.token import Text, Comment, Keyword, Name, String, Number, \
|
|
Whitespace
|
|
|
|
|
|
__all__ = ['ForthLexer']
|
|
|
|
|
|
class ForthLexer(RegexLexer):
|
|
"""
|
|
Lexer for Forth files.
|
|
|
|
.. versionadded:: 2.2
|
|
"""
|
|
name = 'Forth'
|
|
url = 'https://www.forth.com/forth/'
|
|
aliases = ['forth']
|
|
filenames = ['*.frt', '*.fs']
|
|
mimetypes = ['application/x-forth']
|
|
|
|
flags = re.IGNORECASE | re.MULTILINE
|
|
|
|
tokens = {
|
|
'root': [
|
|
(r'\s+', Whitespace),
|
|
# All comment types
|
|
(r'\\.*?$', Comment.Single),
|
|
(r'\([\s].*?\)', Comment.Single),
|
|
# defining words. The next word is a new command name
|
|
(r'(:|variable|constant|value|buffer:)(\s+)',
|
|
bygroups(Keyword.Namespace, Whitespace), 'worddef'),
|
|
# strings are rather simple
|
|
(r'([.sc]")(\s+?)', bygroups(String, Whitespace), 'stringdef'),
|
|
# keywords from the various wordsets
|
|
# *** Wordset BLOCK
|
|
(r'(blk|block|buffer|evaluate|flush|load|save-buffers|update|'
|
|
# *** Wordset BLOCK-EXT
|
|
r'empty-buffers|list|refill|scr|thru|'
|
|
# *** Wordset CORE
|
|
r'\#s|\*\/mod|\+loop|\/mod|0<|0=|1\+|1-|2!|'
|
|
r'2\*|2\/|2@|2drop|2dup|2over|2swap|>body|'
|
|
r'>in|>number|>r|\?dup|abort|abort\"|abs|'
|
|
r'accept|align|aligned|allot|and|base|begin|'
|
|
r'bl|c!|c,|c@|cell\+|cells|char|char\+|'
|
|
r'chars|constant|count|cr|create|decimal|'
|
|
r'depth|do|does>|drop|dup|else|emit|environment\?|'
|
|
r'evaluate|execute|exit|fill|find|fm\/mod|'
|
|
r'here|hold|i|if|immediate|invert|j|key|'
|
|
r'leave|literal|loop|lshift|m\*|max|min|'
|
|
r'mod|move|negate|or|over|postpone|quit|'
|
|
r'r>|r@|recurse|repeat|rot|rshift|s\"|s>d|'
|
|
r'sign|sm\/rem|source|space|spaces|state|swap|'
|
|
r'then|type|u\.|u\<|um\*|um\/mod|unloop|until|'
|
|
r'variable|while|word|xor|\[char\]|\[\'\]|'
|
|
r'@|!|\#|<\#|\#>|:|;|\+|-|\*|\/|,|<|>|\|1\+|1-|\.|'
|
|
# *** Wordset CORE-EXT
|
|
r'\.r|0<>|'
|
|
r'0>|2>r|2r>|2r@|:noname|\?do|again|c\"|'
|
|
r'case|compile,|endcase|endof|erase|false|'
|
|
r'hex|marker|nip|of|pad|parse|pick|refill|'
|
|
r'restore-input|roll|save-input|source-id|to|'
|
|
r'true|tuck|u\.r|u>|unused|value|within|'
|
|
r'\[compile\]|'
|
|
# *** Wordset CORE-EXT-obsolescent
|
|
r'\#tib|convert|expect|query|span|'
|
|
r'tib|'
|
|
# *** Wordset DOUBLE
|
|
r'2constant|2literal|2variable|d\+|d-|'
|
|
r'd\.|d\.r|d0<|d0=|d2\*|d2\/|d<|d=|d>s|'
|
|
r'dabs|dmax|dmin|dnegate|m\*\/|m\+|'
|
|
# *** Wordset DOUBLE-EXT
|
|
r'2rot|du<|'
|
|
# *** Wordset EXCEPTION
|
|
r'catch|throw|'
|
|
# *** Wordset EXCEPTION-EXT
|
|
r'abort|abort\"|'
|
|
# *** Wordset FACILITY
|
|
r'at-xy|key\?|page|'
|
|
# *** Wordset FACILITY-EXT
|
|
r'ekey|ekey>char|ekey\?|emit\?|ms|time&date|'
|
|
# *** Wordset FILE
|
|
r'BIN|CLOSE-FILE|CREATE-FILE|DELETE-FILE|FILE-POSITION|'
|
|
r'FILE-SIZE|INCLUDE-FILE|INCLUDED|OPEN-FILE|R\/O|'
|
|
r'R\/W|READ-FILE|READ-LINE|REPOSITION-FILE|RESIZE-FILE|'
|
|
r'S\"|SOURCE-ID|W/O|WRITE-FILE|WRITE-LINE|'
|
|
# *** Wordset FILE-EXT
|
|
r'FILE-STATUS|FLUSH-FILE|REFILL|RENAME-FILE|'
|
|
# *** Wordset FLOAT
|
|
r'>float|d>f|'
|
|
r'f!|f\*|f\+|f-|f\/|f0<|f0=|f<|f>d|f@|'
|
|
r'falign|faligned|fconstant|fdepth|fdrop|fdup|'
|
|
r'fliteral|float\+|floats|floor|fmax|fmin|'
|
|
r'fnegate|fover|frot|fround|fswap|fvariable|'
|
|
r'represent|'
|
|
# *** Wordset FLOAT-EXT
|
|
r'df!|df@|dfalign|dfaligned|dfloat\+|'
|
|
r'dfloats|f\*\*|f\.|fabs|facos|facosh|falog|'
|
|
r'fasin|fasinh|fatan|fatan2|fatanh|fcos|fcosh|'
|
|
r'fe\.|fexp|fexpm1|fln|flnp1|flog|fs\.|fsin|'
|
|
r'fsincos|fsinh|fsqrt|ftan|ftanh|f~|precision|'
|
|
r'set-precision|sf!|sf@|sfalign|sfaligned|sfloat\+|'
|
|
r'sfloats|'
|
|
# *** Wordset LOCAL
|
|
r'\(local\)|to|'
|
|
# *** Wordset LOCAL-EXT
|
|
r'locals\||'
|
|
# *** Wordset MEMORY
|
|
r'allocate|free|resize|'
|
|
# *** Wordset SEARCH
|
|
r'definitions|find|forth-wordlist|get-current|'
|
|
r'get-order|search-wordlist|set-current|set-order|'
|
|
r'wordlist|'
|
|
# *** Wordset SEARCH-EXT
|
|
r'also|forth|only|order|previous|'
|
|
# *** Wordset STRING
|
|
r'-trailing|\/string|blank|cmove|cmove>|compare|'
|
|
r'search|sliteral|'
|
|
# *** Wordset TOOLS
|
|
r'.s|dump|see|words|'
|
|
# *** Wordset TOOLS-EXT
|
|
r';code|'
|
|
r'ahead|assembler|bye|code|cs-pick|cs-roll|'
|
|
r'editor|state|\[else\]|\[if\]|\[then\]|'
|
|
# *** Wordset TOOLS-EXT-obsolescent
|
|
r'forget|'
|
|
# Forth 2012
|
|
r'defer|defer@|defer!|action-of|begin-structure|field:|buffer:|'
|
|
r'parse-name|buffer:|traverse-wordlist|n>r|nr>|2value|fvalue|'
|
|
r'name>interpret|name>compile|name>string|'
|
|
r'cfield:|end-structure)(?!\S)', Keyword),
|
|
|
|
# Numbers
|
|
(r'(\$[0-9A-F]+)', Number.Hex),
|
|
(r'(\#|%|&|\-|\+)?[0-9]+', Number.Integer),
|
|
(r'(\#|%|&|\-|\+)?[0-9.]+', Keyword.Type),
|
|
# amforth specific
|
|
(r'(@i|!i|@e|!e|pause|noop|turnkey|sleep|'
|
|
r'itype|icompare|sp@|sp!|rp@|rp!|up@|up!|'
|
|
r'>a|a>|a@|a!|a@+|a@-|>b|b>|b@|b!|b@+|b@-|'
|
|
r'find-name|1ms|'
|
|
r'sp0|rp0|\(evaluate\)|int-trap|int!)(?!\S)',
|
|
Name.Constant),
|
|
# a proposal
|
|
(r'(do-recognizer|r:fail|recognizer:|get-recognizers|'
|
|
r'set-recognizers|r:float|r>comp|r>int|r>post|'
|
|
r'r:name|r:word|r:dnum|r:num|recognizer|forth-recognizer|'
|
|
r'rec:num|rec:float|rec:word)(?!\S)', Name.Decorator),
|
|
# defining words. The next word is a new command name
|
|
(r'(Evalue|Rvalue|Uvalue|Edefer|Rdefer|Udefer)(\s+)',
|
|
bygroups(Keyword.Namespace, Text), 'worddef'),
|
|
|
|
(r'\S+', Name.Function), # Anything else is executed
|
|
|
|
],
|
|
'worddef': [
|
|
(r'\S+', Name.Class, '#pop'),
|
|
],
|
|
'stringdef': [
|
|
(r'[^"]+', String, '#pop'),
|
|
],
|
|
}
|
|
|
|
def analyse_text(text):
|
|
"""Forth uses : COMMAND ; quite a lot in a single line, so we're trying
|
|
to find that."""
|
|
if re.search('\n:[^\n]+;\n', text):
|
|
return 0.3
|