mirror of
https://github.com/russolsen/sallyforth
synced 2024-12-26 21:58:32 +01:00
Added :keywords, Token class.
This commit is contained in:
parent
a956438aec
commit
4473e149c3
1 changed files with 70 additions and 14 deletions
|
@ -1,5 +1,38 @@
|
||||||
import io
|
import io
|
||||||
|
|
||||||
|
def to_number(token):
|
||||||
|
try:
|
||||||
|
return int(token)
|
||||||
|
except ValueError:
|
||||||
|
try:
|
||||||
|
return float(token)
|
||||||
|
except ValueError:
|
||||||
|
return None
|
||||||
|
|
||||||
|
class Token:
|
||||||
|
def __init__(self, kind, value):
|
||||||
|
self.kind = kind
|
||||||
|
self.value = value
|
||||||
|
|
||||||
|
def isstring(self):
|
||||||
|
return self.kind == 'string'
|
||||||
|
|
||||||
|
def isword(self):
|
||||||
|
return self.kind == 'word'
|
||||||
|
|
||||||
|
def iskeyword(self):
|
||||||
|
return self.kind == 'keyword'
|
||||||
|
|
||||||
|
def isnumber(self):
|
||||||
|
return self.kind == 'number'
|
||||||
|
|
||||||
|
def __repr__(self):
|
||||||
|
return str(self)
|
||||||
|
|
||||||
|
def __str__(self):
|
||||||
|
return f'Token[{self.kind} => {self.value}]'
|
||||||
|
|
||||||
|
|
||||||
class PromptInputStream:
|
class PromptInputStream:
|
||||||
def __init__(self, prompt_f):
|
def __init__(self, prompt_f):
|
||||||
self.prompt_f = prompt_f
|
self.prompt_f = prompt_f
|
||||||
|
@ -25,19 +58,30 @@ class TokenStream:
|
||||||
return ch in [' ', '\t', '\n']
|
return ch in [' ', '\t', '\n']
|
||||||
|
|
||||||
def get_token(self):
|
def get_token(self):
|
||||||
|
t = self.x_get_token()
|
||||||
|
#print("GET token:", t)
|
||||||
|
return t
|
||||||
|
|
||||||
|
def x_get_token(self):
|
||||||
state = 'start'
|
state = 'start'
|
||||||
token = ''
|
token = ''
|
||||||
while True:
|
while True:
|
||||||
ch = self.read_f()
|
ch = self.read_f()
|
||||||
#print(f'ch: {ch} typech {type(ch)} state {state}')
|
#print(f'ch: {ch} typech {type(ch)} state {state}')
|
||||||
if ch in ['', None]:
|
if ch in ['', None]:
|
||||||
if state in ['word', 'sqstring', 'dqstring']:
|
if state in ['sqstring', 'dqstring']:
|
||||||
return [state, token]
|
return Token('string', token)
|
||||||
return ['eof', '']
|
if state in ['word']:
|
||||||
|
return Token('word', token)
|
||||||
|
return None
|
||||||
|
elif state == 'start' and ch == ':':
|
||||||
|
token = ch
|
||||||
|
state = 'keyword'
|
||||||
|
elif state == 'start' and ch in "+-0123456789":
|
||||||
|
token = ch
|
||||||
|
state = 'number'
|
||||||
elif state == 'start' and ch == '\\':
|
elif state == 'start' and ch == '\\':
|
||||||
state = 'lcomment'
|
state = 'lcomment'
|
||||||
elif state == 'start' and ch == '%':
|
|
||||||
return ['word', ch]
|
|
||||||
elif state == 'lcomment' and ch == '\n':
|
elif state == 'lcomment' and ch == '\n':
|
||||||
state = 'start'
|
state = 'start'
|
||||||
elif state == 'start' and ch == '(':
|
elif state == 'start' and ch == '(':
|
||||||
|
@ -49,16 +93,28 @@ class TokenStream:
|
||||||
elif state == 'start' and ch == '"':
|
elif state == 'start' and ch == '"':
|
||||||
state = 'dqstring'
|
state = 'dqstring'
|
||||||
elif state == 'dqstring' and ch == '"':
|
elif state == 'dqstring' and ch == '"':
|
||||||
return [state, token]
|
return Token('string', token)
|
||||||
elif state == 'start' and ch == "'":
|
elif state == 'start' and ch == "'":
|
||||||
state = 'sqstring'
|
state = 'sqstring'
|
||||||
elif state == 'start':
|
elif state == 'start':
|
||||||
state = 'word'
|
state = 'word'
|
||||||
token += ch
|
token += ch
|
||||||
elif state in ['word', 'sqstring'] and \
|
elif state == 'number' and self.whitespace(ch):
|
||||||
self.whitespace(ch):
|
n = to_number(token)
|
||||||
return state, token
|
if n:
|
||||||
elif state in ['word', 'dqstring', 'sqstring']:
|
return Token('number', n)
|
||||||
|
else:
|
||||||
|
return Token('word', token)
|
||||||
|
elif state == 'word' and self.whitespace(ch):
|
||||||
|
return Token('word', token)
|
||||||
|
elif state == 'sqstring' and self.whitespace(ch):
|
||||||
|
return Token('string', token)
|
||||||
|
elif state == 'keyword' and self.whitespace(ch):
|
||||||
|
state = 'start'
|
||||||
|
if len(token) == 1:
|
||||||
|
return Token('word', token)
|
||||||
|
return Token('keyword', token)
|
||||||
|
elif state in ['word', 'dqstring', 'sqstring', 'number', 'keyword']:
|
||||||
token += ch
|
token += ch
|
||||||
|
|
||||||
def file_token_stream(f):
|
def file_token_stream(f):
|
||||||
|
@ -83,7 +139,7 @@ if __name__ == "__main__":
|
||||||
pis = PromptInputStream(pmt)
|
pis = PromptInputStream(pmt)
|
||||||
ts = TokenStream(pis.getc)
|
ts = TokenStream(pis.getc)
|
||||||
|
|
||||||
kind, token = ts.get_token()
|
result = ts.get_token()
|
||||||
while kind != 'eof':
|
while result:
|
||||||
print(kind, token)
|
print("result:", result)
|
||||||
kind, token = ts.get_token()
|
result = ts.get_token()
|
||||||
|
|
Loading…
Reference in a new issue