2020-12-30 12:09:11 +01:00
|
|
|
h@l@h@!h@C+h!k1k0-h@$k
|
2020-12-30 13:17:09 +01:00
|
|
|
h@k1k0-+$h@C+h!ih@!h@C+h!kefh@!h@C+h!l!
|
|
|
|
h@l@h@!h@C+h!k1k0-h@$k h@k1k0-+$h@C+h!ih@!h@C+h!kefh@!h@C+h!l!
|
2020-12-30 12:09:11 +01:00
|
|
|
|
2020-12-30 16:52:36 +01:00
|
|
|
h@l@ h@!h@C+h! k1k0-h@$ k\h@k1k0-+$ h@C+h!
|
2020-12-30 14:00:20 +01:00
|
|
|
i h@!h@C+h!
|
|
|
|
kkf h@!h@C+h!
|
|
|
|
kLf h@!h@C+h!
|
|
|
|
k:k0- h@!h@C+h!
|
|
|
|
k=f h@!h@C+h!
|
|
|
|
kJf h@!h@C+h!
|
|
|
|
k0k5-C* h@!h@C+h!
|
|
|
|
kef h@!h@C+h!
|
|
|
|
l!
|
|
|
|
|
|
|
|
\ **Now we can use single-line comments!**
|
|
|
|
|
|
|
|
\ planckforth -
|
|
|
|
\ Copyright (C) 2020 nineties
|
|
|
|
|
2020-12-30 14:38:27 +01:00
|
|
|
\ This project aims to create a full-fledged Forth interpreter
|
|
|
|
\ by bootstrapping from hand-written tiny ELF binary.
|
|
|
|
|
|
|
|
\ In the 1st stage, only single character words are registered
|
|
|
|
\ in the dictionary.
|
|
|
|
\ List of builtin words:
|
|
|
|
\ 'Q' ( -- ) Exit the process
|
|
|
|
\ 'C' ( -- n ) The size of Cells
|
|
|
|
\ 'h' ( -- addr ) The address of 'here' cell
|
|
|
|
\ 'l' ( -- addr ) The address of 'latest' cell
|
|
|
|
\ 'k' ( -- c ) Read character
|
|
|
|
\ 't' ( c -- ) Print character
|
|
|
|
\ 'j' ( -- ) Unconditional branch
|
|
|
|
\ 'J' ( a -- ) Jump if a == 0
|
|
|
|
\ 'f' ( c -- xt ) Get execution token of c
|
|
|
|
\ 'x' ( xt -- ... ) Run the execution token
|
|
|
|
\ '@' ( addr -- a ) Load value from addr
|
|
|
|
\ '!' ( a addr -- ) Store value to addr
|
|
|
|
\ '?' ( addr -- c ) Load byte from addr
|
|
|
|
\ '$' ( c addr -- ) Store byte to addr
|
|
|
|
\ 'd' ( -- addr ) Get data stack pointer
|
|
|
|
\ 'D' ( addr -- ) Set data stack pointer
|
|
|
|
\ 'r' ( -- addr ) Get return stack pointer
|
|
|
|
\ 'R' ( addr -- ) Set return stack pointer
|
|
|
|
\ 'i' ( -- addr ) Get the interpreter function
|
|
|
|
\ 'e' ( -- ) Exit current function
|
|
|
|
\ 'L' ( -- a ) Load immediate
|
|
|
|
\ 'S' ( -- addr len) Load string literal
|
|
|
|
\ '+' ( a b -- c ) c = (a + b)
|
|
|
|
\ '-' ( a b -- c ) c = (a - b)
|
|
|
|
\ '*' ( a b -- c ) c = (a * b)
|
|
|
|
\ '/' ( a b -- c ) c = (a / b)
|
|
|
|
\ '%' ( a b -- c ) c = (a % b)
|
|
|
|
\ '&' ( a b -- c ) c = (a & b)
|
|
|
|
\ '|' ( a b -- c ) c = (a | b)
|
|
|
|
\ '^' ( a b -- c ) c = (a ^ b)
|
|
|
|
\ '<' ( a b -- c ) c = (a < b)
|
|
|
|
\ '=' ( a b -- c ) c = (a == b
|
|
|
|
|
|
|
|
\ The 1st stage interpreter repeats execution of k, f and x.
|
|
|
|
\ There is no concept such as IMMEDIATE mode yet.
|
|
|
|
|
|
|
|
\ There following line is an example program of planckforth
|
|
|
|
\ which prints "Hello World!\n"
|
|
|
|
\ --
|
|
|
|
\ kHtketkltkltkotk tkWtkotkrtkltkdtk!tk:k0-tQ
|
|
|
|
\ --
|
|
|
|
\ This code repeats that 'k' reads a character and 't' prints it.
|
|
|
|
\ Note that ':' (58) minus '0' (48) is '\n' (10).
|
|
|
|
|
|
|
|
\ The structure of the dictionary is sames as many Forth implementation.
|
|
|
|
\ +------+----------+---------+------------+---------------+
|
|
|
|
\ | link | len+flag | name... | padding... | code field ...|
|
|
|
|
\ +------+----------+---------+------------+---------------+
|
|
|
|
\ - link pointer to the previous entry (CELL byte)
|
2021-01-01 10:37:41 +01:00
|
|
|
\ - length of the name (6 bits)
|
|
|
|
\ - smudge bit (1 bit)
|
|
|
|
\ - immediate bit (1 bit)
|
2020-12-30 14:38:27 +01:00
|
|
|
\ - characters of the name (N bits)
|
|
|
|
\ - padding to align CELL boundary if necessary.
|
|
|
|
\ - codewords and datawords (CELL-bye aligned)
|
|
|
|
|
|
|
|
\ The code group at the beginning of this file
|
|
|
|
\ defines ' ' and '\n' as no-op operation and
|
|
|
|
\ '\' to read following characters until '\n'.
|
|
|
|
\ Since I couldn't write a comment at the beginning,
|
|
|
|
\ I repost the definition of '\' for explanation.
|
|
|
|
\ --
|
|
|
|
\ h@ ( save addr of new entry )
|
|
|
|
\ l@ h@!h@C+h! ( set link pointer. *here++ = latest )
|
2020-12-30 14:41:49 +01:00
|
|
|
\ k1k0-h@$ k\h@k1k0-+$ h@C+h! ( write the name '\' and its length )
|
2020-12-30 14:38:27 +01:00
|
|
|
\ i h@!h@C+h! ( docol )
|
|
|
|
\ kkf h@!h@C+h! ( key )
|
|
|
|
\ kLf h@!h@C+h! ( lit )
|
|
|
|
\ k:k0- h@!h@C+h! ( '\n' )
|
|
|
|
\ k=f h@!h@C+h! ( = )
|
|
|
|
\ kJf h@!h@C+h! ( branch )
|
|
|
|
\ k0k5-C* h@!h@C+h! ( -5*CELL )
|
|
|
|
\ kef h@!h@C+h! ( exit )
|
|
|
|
\ l! ( set latest to this new entry. )
|
|
|
|
\ --
|
|
|
|
|
2020-12-30 14:48:07 +01:00
|
|
|
\ That's all for the brief explanation. Let's restart bootstrap!
|
|
|
|
|
2020-12-30 14:51:29 +01:00
|
|
|
\ The COMMA operator
|
|
|
|
\ ',' ( a -- ) Store a to 'here' and increment 'here' CELL bytes.
|
2020-12-30 16:52:36 +01:00
|
|
|
h@l@ h@!h@C+h! k1k0-h@$ k,h@k1k0-+$ h@C+h!
|
2020-12-30 14:51:29 +01:00
|
|
|
i h@!h@C+h! \ docol
|
2020-12-30 15:23:07 +01:00
|
|
|
\ store 'a' to here
|
2020-12-30 14:51:29 +01:00
|
|
|
khf h@!h@C+h!
|
|
|
|
k@f h@!h@C+h!
|
2020-12-30 15:23:07 +01:00
|
|
|
k!f h@!h@C+h!
|
|
|
|
\ here <- here + CELL
|
2020-12-30 14:51:29 +01:00
|
|
|
khf h@!h@C+h!
|
|
|
|
k@f h@!h@C+h!
|
|
|
|
kCf h@!h@C+h!
|
2020-12-30 15:23:07 +01:00
|
|
|
k+f h@!h@C+h!
|
2020-12-30 14:51:29 +01:00
|
|
|
khf h@!h@C+h!
|
2020-12-30 15:23:07 +01:00
|
|
|
k!f h@!h@C+h!
|
|
|
|
\ exit
|
|
|
|
kef h@!h@C+h!
|
2020-12-30 14:51:29 +01:00
|
|
|
l!
|
|
|
|
|
2020-12-30 15:42:38 +01:00
|
|
|
\ TICK-like operator
|
|
|
|
\ '\'' ( "c" -- xt ) Get execution token of following character
|
|
|
|
\ NB: This definition is different from the usual definition of tick
|
|
|
|
\ because it does not skip leading spaces and can read only a single
|
|
|
|
\ character. It will be redefined in later stage.
|
2020-12-30 16:52:36 +01:00
|
|
|
h@l@, k1k0-h@$ k'h@k1k0-+$ h@C+h!
|
2020-12-30 15:42:38 +01:00
|
|
|
i, kkf, kff, kef,
|
|
|
|
l!
|
|
|
|
|
2020-12-30 16:52:53 +01:00
|
|
|
\ Utility for defining a word
|
|
|
|
\ 'c' ( "c" -- w )
|
|
|
|
\ Read character, create new word then push its address.
|
|
|
|
\ 'latest' will not be updated.
|
|
|
|
h@l@, k1k0-h@$ kch@k1k0-+$ h@C+h!
|
|
|
|
i, 'h, '@, 'l, '@, ',,
|
|
|
|
'L, k1k0-, 'h, '@, '$,
|
|
|
|
'k, 'h, '@, 'L, k1k0-, '+, '$,
|
2020-12-31 00:26:06 +01:00
|
|
|
'h, '@, 'C, '+, 'h, '!,
|
|
|
|
'e, l!
|
2020-12-30 16:52:53 +01:00
|
|
|
|
2020-12-30 16:59:24 +01:00
|
|
|
\ '_' ( a -- ) DROP
|
|
|
|
c_ i, 'd, 'C, '+, 'D, 'e, l!
|
|
|
|
|
2020-12-30 22:25:40 +01:00
|
|
|
\ '#' ( a -- a a ) DUP
|
|
|
|
c# i, 'd, '@, 'e, l!
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
\ Implementations of TOR and FROMR are a bit tricky.
|
|
|
|
\ Since return-address will be placed at the top of return stack,
|
|
|
|
\ the code in the body of these function have to manipulate
|
|
|
|
\ 2nd element of the stack.
|
|
|
|
|
|
|
|
\ '{' ( a -- R:a ) TOR
|
|
|
|
\ Move value from data stack to return stack.
|
2020-12-31 00:26:06 +01:00
|
|
|
c{ i,
|
2020-12-30 22:25:40 +01:00
|
|
|
'r, 'r, '@, \ ( a rsp ret )
|
2020-12-30 22:36:20 +01:00
|
|
|
'r, 'C, '-, '#, \ ( a rsp ret rsp-1 rsp-1 )
|
|
|
|
'R, \ ( a rsp+1 ret rsp ) extend return stack
|
|
|
|
'!, \ ( a rsp+1 ) store return address to the top
|
2020-12-30 22:25:40 +01:00
|
|
|
'!, \ store a to the 2nd
|
2020-12-31 00:26:06 +01:00
|
|
|
'e, l!
|
2020-12-30 22:25:40 +01:00
|
|
|
|
|
|
|
\ '}' ( R:a -- a ) FROMR
|
|
|
|
\ Move value from return stack to data stack.
|
2020-12-31 00:26:06 +01:00
|
|
|
c} i,
|
2020-12-30 22:25:40 +01:00
|
|
|
'r, 'C, '+, '@, \ ( a ) load 2nd value
|
|
|
|
'r, '@, \ ( a ret ) load return addr
|
2020-12-30 22:36:20 +01:00
|
|
|
'r, 'C, '+, '#, \ ( a ret rsp+1 rsp+1 )
|
2020-12-30 22:25:40 +01:00
|
|
|
'R, \ ( a ret rsp ) reduce return stack
|
|
|
|
'!, \ ( a , R:ret ) store return addr to top of return stack
|
2020-12-31 00:26:06 +01:00
|
|
|
'e, l!
|
2020-12-30 22:25:40 +01:00
|
|
|
|
2020-12-30 22:39:43 +01:00
|
|
|
\ 'o' ( a b -- a b a ) OVER
|
|
|
|
co i, 'd, 'C, '+, '@, 'e, l!
|
2020-12-30 22:37:08 +01:00
|
|
|
|
|
|
|
\ '~' ( a b -- b a ) SWAP
|
|
|
|
c~ i,
|
2020-12-30 22:39:43 +01:00
|
|
|
'o, \ ( a b a )
|
2020-12-30 22:37:08 +01:00
|
|
|
'{, \ ( a b , R:a )
|
|
|
|
'd, 'C, '+, \ ( a b sp+1 , R:a )
|
|
|
|
'!, \ ( b , R:a )
|
|
|
|
'}, \ ( b a )
|
2020-12-31 00:26:06 +01:00
|
|
|
'e, l!
|
2020-12-30 22:37:08 +01:00
|
|
|
|
2020-12-30 23:50:02 +01:00
|
|
|
\ 'B' ( c -- ) C-COMMA
|
|
|
|
\ Store byte 'c' to here and increment it
|
2020-12-31 01:40:29 +01:00
|
|
|
cB i, 'h, '@, '$, 'h, '@, 'L, k1k0-, '+, 'h, '!, 'e, l!
|
2020-12-30 22:39:43 +01:00
|
|
|
|
2020-12-31 11:36:45 +01:00
|
|
|
\ 'm' ( c-addr u -- ) CMOVE,
|
|
|
|
\ Copy u bytes from c-addr to here,
|
|
|
|
\ increment here u bytes.
|
2020-12-31 05:10:18 +01:00
|
|
|
cm i,
|
|
|
|
\ <loop>
|
2020-12-31 11:36:45 +01:00
|
|
|
'#, 'J, k>k0-C*, \ goto <exit> if u=0
|
2020-12-31 05:10:18 +01:00
|
|
|
'{, \ preserve u
|
2020-12-31 11:36:45 +01:00
|
|
|
'#, '?, 'B, \ copy byte
|
|
|
|
'L, k1k0-, '+, \ increment c-addr
|
2020-12-31 05:10:18 +01:00
|
|
|
'}, 'L, k1k0-, '-, \ decrement u
|
2020-12-31 11:36:45 +01:00
|
|
|
'j, k0k?-C*, \ goto <loop>
|
2020-12-31 05:10:18 +01:00
|
|
|
\ <exit>
|
2020-12-31 11:36:45 +01:00
|
|
|
'_, '_,
|
2020-12-31 05:10:18 +01:00
|
|
|
'e, l!
|
|
|
|
|
2020-12-31 00:09:22 +01:00
|
|
|
\ 'a' ( c-addr -- a-addr ) ALIGNED
|
2020-12-31 16:42:30 +01:00
|
|
|
\ Round up to a nearlest multiple of CELL
|
2020-12-31 00:09:22 +01:00
|
|
|
ca i,
|
2020-12-31 00:13:42 +01:00
|
|
|
'L, Ck1k0--, '+, \ ( a+CELL-1 )
|
|
|
|
'L, k0k0-C-, \ ( a+CELL-1 ~(CELL-1) )
|
2020-12-31 00:26:06 +01:00
|
|
|
'&,
|
|
|
|
'e, l!
|
2020-12-31 00:09:22 +01:00
|
|
|
|
|
|
|
\ 'A' ( -- ) ALIGN
|
2020-12-31 16:42:30 +01:00
|
|
|
\ Round up 'here' to a nearlest multiple of CELL
|
2020-12-31 00:09:22 +01:00
|
|
|
cA i, 'h, '@, 'a, 'h, '!, 'e, l!
|
|
|
|
|
2020-12-31 01:40:42 +01:00
|
|
|
\ 'E' ( c-addr1 u1 c-addr2 u2 -- n ) STR=
|
|
|
|
\ Compare two strings.
|
|
|
|
\ Return 1 if they are same 0 otherwise.
|
|
|
|
cE i,
|
|
|
|
'{, '~, '}, \ ( c-addr1 c-addr2 u1 u2 )
|
|
|
|
'o, '=, 'J, kVk0-C*, \ jump to <not_equal> if u1!=u2
|
|
|
|
\ <loop>
|
|
|
|
\ ( c-addr1 c-addr2 u )
|
|
|
|
'#, 'J, kMk0-C*, \ jump to <equal> if u==0
|
|
|
|
'{, \ preserve u
|
|
|
|
'o, '?, \ ( c-addr1 c-addr2 c1 )
|
|
|
|
'o, '?, \ ( c-addr1 c-addr2 c1 c2 )
|
2020-12-31 01:52:17 +01:00
|
|
|
'}, \ ( c-addr1 c-addr2 c1 c2 u ) restore u
|
2020-12-31 01:40:42 +01:00
|
|
|
'~, '{, '~, '}, \ ( c-addr1 c-addr2 u c1 c2 )
|
|
|
|
'=, 'J, kFk0-C*, \ jump to <not_equal> if c1!=c2
|
|
|
|
'{, '{, \ ( c-addr1 , R:u c-addr2 )
|
|
|
|
'L, k1k0-, '+, \ increment c-addr1
|
|
|
|
'}, 'L, k1k0-, '+, \ increment c-addrr2
|
|
|
|
'}, 'L, k1k0-, '-, \ decrement u
|
|
|
|
'j, k0kN-C*, \ jump to <loop>
|
|
|
|
\ <equal>
|
|
|
|
'_, '_, '_, 'L, k1k0-, 'e,
|
|
|
|
\ <not_equal>
|
|
|
|
'_, '_, '_, 'L, k0k0-, 'e,
|
|
|
|
l!
|
|
|
|
|
2020-12-31 03:59:09 +01:00
|
|
|
\ 's' ( c -- n)
|
|
|
|
\ Return 1 if c==' ' or c=='\n', 0 otherwise.
|
|
|
|
cs i, '#, 'L, k , '=, '~, 'L, k:k0-, '=, '|, 'e, l!
|
|
|
|
|
2020-12-31 12:42:43 +01:00
|
|
|
\ 'W' ( "name" -- c-addr u )
|
2020-12-31 03:59:09 +01:00
|
|
|
\ Skip leading spaces (' ' and '\n'),
|
|
|
|
\ Read name, then return its address and length.
|
2021-01-01 10:37:41 +01:00
|
|
|
\ The maximum length of the name is 63. The behavior is undefined
|
|
|
|
\ when the name exceeds 63 characters,
|
2020-12-31 03:59:09 +01:00
|
|
|
\ Note that it returns the address of statically allocated buffer,
|
|
|
|
\ so the content will be overwritten each time 'w' executed.
|
|
|
|
|
2021-01-01 10:37:41 +01:00
|
|
|
\ Allocate buffer of 63 bytes or more,
|
2020-12-31 03:59:09 +01:00
|
|
|
\ push the address for compilation of 'w'
|
2021-01-01 10:37:41 +01:00
|
|
|
h@ # kok0-+ h! A
|
2020-12-31 06:44:39 +01:00
|
|
|
cW~
|
2020-12-31 03:59:09 +01:00
|
|
|
i,
|
|
|
|
\ skip leading spaces
|
|
|
|
'k, '#, 's, 'J, k4k0-C*, '_, 'j, k0k7-C*,
|
|
|
|
\ p=address of buffer
|
|
|
|
'L, #, '~,
|
|
|
|
\ <loop>
|
|
|
|
\ ( p c )
|
|
|
|
'o, '$, \ store c to p
|
|
|
|
'L, k1k0-, '+, \ increment p
|
|
|
|
'k, '#, 's, 'J, k0k9-C*, \ goto <loop> if c is not space
|
|
|
|
'_, 'L, , \ ( p buf )
|
|
|
|
'~, 'o, '-, \ ( buf p-buf )
|
|
|
|
'e, l!
|
|
|
|
|
2020-12-31 05:27:25 +01:00
|
|
|
\ 'F' ( c-addr u -- w )
|
|
|
|
\ Lookup multi-character word from dictionary.
|
2020-12-31 07:10:54 +01:00
|
|
|
\ Return 0 if the word is not found.
|
2021-01-01 10:37:41 +01:00
|
|
|
\ Entries with smudge-bit=1 are ignored.
|
2020-12-31 05:27:25 +01:00
|
|
|
cF i,
|
2020-12-31 06:45:02 +01:00
|
|
|
'l, '@,
|
|
|
|
\ <loop> ( addr u it )
|
2021-01-01 10:37:41 +01:00
|
|
|
'#, 'J, kUk0-C*, \ goto <exit> if it=NULL
|
|
|
|
'#, 'C, '+, '?, \ ( addr u it len+flag )
|
|
|
|
'L, k@, '&, \ test smudge-bit of it
|
|
|
|
'J, k4k0-C*,
|
2020-12-31 05:27:25 +01:00
|
|
|
\ <1>
|
2021-01-01 10:37:41 +01:00
|
|
|
\ smudge-bit=1
|
|
|
|
'@, \ load link
|
|
|
|
'j, k0k>-C*, \ goto <loop>
|
|
|
|
\ <2>
|
|
|
|
\ smudge-bit=0
|
|
|
|
'{, 'o, 'o, 'r, '@, '~, '{, '~, '}, '},
|
|
|
|
\ ( addr u it addr u it )
|
|
|
|
'#, 'L, Ck1k0-+, '+, \ address of name
|
|
|
|
'~, 'C, '+, '?, \ length+flag
|
|
|
|
'L, kok0-, '&, \ take length (lower 6-bits)
|
|
|
|
\ ( addr1 u1 it addr1 u1 addr2 u2 )
|
|
|
|
'E, 'J, k0kJ-C*, \ goto <1> if different name
|
2020-12-31 05:27:25 +01:00
|
|
|
\ <exit>
|
2020-12-31 06:45:02 +01:00
|
|
|
'{, '_, '_, '}, \ Drop addr u return it
|
2020-12-31 05:27:25 +01:00
|
|
|
'e, l!
|
2020-12-31 05:10:18 +01:00
|
|
|
|
2020-12-31 07:10:54 +01:00
|
|
|
\ 'G' ( w -- xt )
|
|
|
|
\ Get CFA of the word
|
|
|
|
cG i,
|
|
|
|
'C, '+, '#, '?, \ ( addr len+flag )
|
2021-01-01 10:37:41 +01:00
|
|
|
'L, kok0-, '&, \ take length
|
2020-12-31 07:10:54 +01:00
|
|
|
'+, \ add length to the addr
|
|
|
|
'L, k1k0-, '+, \ add 1 to the addr (1byte for len+field)
|
|
|
|
'a, \ align
|
|
|
|
'e, l!
|
2020-12-31 07:52:39 +01:00
|
|
|
|
2020-12-31 09:46:11 +01:00
|
|
|
\ 'M' ( -- c-addr)
|
|
|
|
\ The state variable
|
2020-12-31 07:52:39 +01:00
|
|
|
\ 0: immediate mode
|
|
|
|
\ 1: compile mode
|
2020-12-31 09:46:11 +01:00
|
|
|
h@ k0k0-, \ allocate 1 cell and fill 0
|
|
|
|
cM~ i, 'L, , 'e, l!
|
2020-12-31 07:52:39 +01:00
|
|
|
|
2020-12-31 10:04:08 +01:00
|
|
|
\ 'I'
|
|
|
|
\ The 2nd Stage Interpreter
|
|
|
|
cI i,
|
|
|
|
\ <loop>
|
2020-12-31 10:23:02 +01:00
|
|
|
'W, \ read name from input
|
|
|
|
'F, \ find word
|
|
|
|
'M, '@, \ read state
|
|
|
|
'J, kAk0-C*, \ goto <immediate> if state=0
|
|
|
|
\ <compile>
|
|
|
|
'#, 'C, '+, '?, \ ( w len+flag )
|
|
|
|
'L, k@k@+, '&, \ test immediate bit
|
|
|
|
'L, k0k0-, '=,
|
|
|
|
'J, k5k0-C*, \ goto <immediate> if immediate-bit=1
|
|
|
|
'G, ',, \ compile CFA
|
2020-12-31 12:22:51 +01:00
|
|
|
'j, k0kE-C*, \ goto <loop>
|
2020-12-31 10:23:02 +01:00
|
|
|
\ <immediate>
|
|
|
|
'G, 'x, \ execute CFA
|
|
|
|
'j, k0kI-C*, \ goto <loop>
|
2020-12-31 10:04:08 +01:00
|
|
|
l!
|
|
|
|
|
2020-12-31 11:01:57 +01:00
|
|
|
I \ Enter 2nd Stage
|
|
|
|
|
|
|
|
\ === 2nd Stage Interpreter ===
|
|
|
|
|
|
|
|
r C + R \ Drop 1st stage interpreter from call stack
|
|
|
|
|
2020-12-31 13:06:22 +01:00
|
|
|
\ '\'' ( "name" -- xt )
|
|
|
|
\ Redefine existing '\'' which uses 'k' and 'f'
|
|
|
|
\ to use 'W' and 'F'.
|
|
|
|
c ' i , ' W , ' F , ' G , ' e , l !
|
|
|
|
|
|
|
|
\ [ immediate ( -- )
|
|
|
|
\ Switch to immediate mode
|
|
|
|
c [ i , ' L , k 0 k 0 - , ' M , ' ! , ' e , l !
|
2020-12-31 15:32:07 +01:00
|
|
|
\ Set immediate-bit of [
|
2020-12-31 13:06:22 +01:00
|
|
|
l @ C + # { ? k @ k @ + | } $
|
|
|
|
|
|
|
|
\ ] ( -- )
|
|
|
|
\ Switch to compile mode
|
|
|
|
c ] i , ' L , k 1 k 0 - , ' M , ' ! , ' e , l !
|
2020-12-31 12:23:08 +01:00
|
|
|
|
2021-01-01 10:37:41 +01:00
|
|
|
\ : ( "name" -- ) COLON
|
|
|
|
\ Read name, create word with smudge=1,
|
2020-12-31 12:23:08 +01:00
|
|
|
\ compile 'docol' and enter compile mode.
|
|
|
|
c : i ,
|
2020-12-31 16:23:27 +01:00
|
|
|
' h , ' @ ,
|
2020-12-31 12:23:08 +01:00
|
|
|
' l , ' @ , ' , , \ fill link
|
2021-01-01 10:37:41 +01:00
|
|
|
' l , ' ! , \ update latest
|
2020-12-31 12:23:08 +01:00
|
|
|
' W , \ read name ( addr len )
|
2021-01-01 10:37:41 +01:00
|
|
|
' # , \ ( addr len len )
|
|
|
|
' L , k @ , ' | ,
|
|
|
|
' B , \ fill length + smudge-bit
|
2020-12-31 12:23:08 +01:00
|
|
|
' m , \ fill name
|
|
|
|
' A , \ align here
|
|
|
|
' i , ' , , \ compile docol
|
2020-12-31 13:06:22 +01:00
|
|
|
' ] , \ enter compile mode
|
2020-12-31 12:23:08 +01:00
|
|
|
' e , l !
|
|
|
|
|
2021-01-01 10:37:41 +01:00
|
|
|
\ ; ( -- ) SEMICOLON
|
|
|
|
\ Compile 'exit', unsmudge latest, and enter immediate mode.
|
2020-12-31 12:23:08 +01:00
|
|
|
c ; i ,
|
|
|
|
' L , ' e , ' , , \ compile exit
|
2021-01-01 10:37:41 +01:00
|
|
|
' l , ' @ ,
|
|
|
|
' C , ' + , ' # , ' ? ,
|
|
|
|
' L , k [ k d + , \ 0xbf
|
|
|
|
' & , ' ~ , ' $ , \ unsmudge
|
|
|
|
' [ , \ enter immediate mode
|
2020-12-31 12:23:08 +01:00
|
|
|
' e , l !
|
2020-12-31 15:32:07 +01:00
|
|
|
\ Set immediate-bit of ';'
|
2020-12-31 12:23:08 +01:00
|
|
|
l @ C + # { ? k @ k @ + | } $
|
|
|
|
|
2021-01-01 10:37:41 +01:00
|
|
|
: immediate-bit [ ' L , k @ k @ + , ] ; \ 0x80
|
|
|
|
: smudge-bit [ ' L , k @ , ] ; \ 0x40
|
|
|
|
: length-mask [ ' L , k o k 0 - , ] ; \ 0x3f
|
2020-12-31 15:34:56 +01:00
|
|
|
|
|
|
|
\ ( "name" -- )
|
|
|
|
: set-immediate
|
|
|
|
W F C + # { ? immediate-bit | } $
|
|
|
|
;
|
|
|
|
|
|
|
|
\ Set immediate-bit of single-line comment word \
|
|
|
|
\ so that we can write comments in compile-mode.
|
|
|
|
set-immediate \
|
2020-12-31 15:47:37 +01:00
|
|
|
|
2021-01-01 10:37:41 +01:00
|
|
|
\ Set immediate-bit of 'latest'
|
2021-01-01 00:23:45 +01:00
|
|
|
: immediate
|
2021-01-01 10:37:41 +01:00
|
|
|
l @ C + # { ? immediate-bit | } $
|
2021-01-01 00:23:45 +01:00
|
|
|
;
|
|
|
|
|
2020-12-31 15:47:37 +01:00
|
|
|
: alias-builtin \ ( "name-new" "name-old" -- )
|
|
|
|
\ Create new word "name-new".
|
|
|
|
\ Copy code pointer of builtin word "name-old" to
|
|
|
|
\ the new word "name-new".
|
|
|
|
\ "name-old" must not be a FORTH word.
|
|
|
|
h @ l @ , l ! \ fill link, update latest
|
|
|
|
W # B m A \ fill length and chars of "name-new"
|
|
|
|
W F G @ , \ fill code-pointer of "name-old"
|
|
|
|
;
|
|
|
|
|
2020-12-31 16:04:21 +01:00
|
|
|
\ Add new names to builtin primities.
|
|
|
|
\ Instead of defining as a new FORTH word like shown below,
|
|
|
|
\ the aliases ared created by copying their code-pointer.
|
|
|
|
\ : new-name old-name ;
|
|
|
|
\ Primitive operators which manipulate program counter and return stack
|
|
|
|
\ can not be defined as a FORTH word.
|
|
|
|
|
2020-12-31 15:47:37 +01:00
|
|
|
alias-builtin bye Q
|
|
|
|
alias-builtin cell C
|
|
|
|
alias-builtin here h
|
|
|
|
alias-builtin latest l
|
|
|
|
alias-builtin key k
|
|
|
|
alias-builtin emit t
|
|
|
|
alias-builtin branch j
|
|
|
|
alias-builtin 0branch J
|
|
|
|
alias-builtin execute x
|
|
|
|
alias-builtin c@ ?
|
|
|
|
alias-builtin c! $
|
|
|
|
alias-builtin sp@ d
|
|
|
|
alias-builtin sp! D
|
|
|
|
alias-builtin rp@ r
|
|
|
|
alias-builtin rp! R
|
|
|
|
alias-builtin docol i
|
|
|
|
alias-builtin exit e
|
|
|
|
alias-builtin lit L
|
|
|
|
alias-builtin litstring S
|
|
|
|
alias-builtin div /
|
|
|
|
alias-builtin mod %
|
|
|
|
alias-builtin and &
|
|
|
|
alias-builtin or |
|
|
|
|
alias-builtin xor ^
|
|
|
|
|
2021-01-01 10:37:41 +01:00
|
|
|
\ Rename existing FORTH words
|
|
|
|
: word W ;
|
|
|
|
: find F ;
|
2021-01-01 12:11:30 +01:00
|
|
|
: >cfa G ;
|
2021-01-01 10:37:41 +01:00
|
|
|
|
|
|
|
\ === Compilers ===
|
|
|
|
|
|
|
|
\ compile: ( n -- )
|
|
|
|
\ runtime: ( -- n )
|
|
|
|
: literal
|
|
|
|
lit lit , \ compile lit
|
|
|
|
, \ compile n
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ compile: ( "name" -- )
|
|
|
|
\ '[compile] word' compiles word *now* even if it is immediate
|
|
|
|
: [compile]
|
|
|
|
' ,
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ ( xt -- )
|
|
|
|
\ postpone compilation of xt
|
|
|
|
: (compile)
|
|
|
|
[compile] literal \ compile 'literal'
|
|
|
|
[ ' , ] literal , \ compile ,
|
|
|
|
;
|
|
|
|
|
|
|
|
\ compile: ( "name" -- )
|
|
|
|
\ 'compile word' compiles word *later* even if it is immediate
|
|
|
|
: compile
|
|
|
|
' (compile)
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ ( -- xt )
|
|
|
|
: :noname
|
|
|
|
here @
|
|
|
|
[ docol ] literal , \ compile docol
|
|
|
|
] \ enter compile mode
|
|
|
|
;
|
|
|
|
|
|
|
|
\ ( "name" -- xt )
|
|
|
|
\ compile time tick
|
|
|
|
: [']
|
|
|
|
' \ read name and get xt
|
|
|
|
[compile] literal \ call literal
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ === Constants ===
|
|
|
|
|
2021-01-01 10:54:42 +01:00
|
|
|
\ Since we don't have integer literals yet,
|
|
|
|
\ define small integer words for convenience
|
|
|
|
\ and readability.
|
|
|
|
: 0 [ key 0 key 0 - ] literal ;
|
|
|
|
: 1 [ key 1 key 0 - ] literal ;
|
|
|
|
: 2 [ key 2 key 0 - ] literal ;
|
|
|
|
: 3 [ key 3 key 0 - ] literal ;
|
2021-01-01 10:37:41 +01:00
|
|
|
|
|
|
|
: true 1 ;
|
|
|
|
: false 0 ;
|
|
|
|
|
|
|
|
\ === Address Arithmetic ===
|
|
|
|
|
|
|
|
: cell+ cell + ;
|
|
|
|
: cell- cell - ;
|
|
|
|
: cells cell * ;
|
|
|
|
|
|
|
|
\ ( c-addr -- a-addr )
|
|
|
|
\ Round up to nearlest multiple of CELL
|
|
|
|
: aligned
|
|
|
|
cell + 1 -
|
|
|
|
0 cell -
|
|
|
|
and
|
|
|
|
;
|
|
|
|
|
|
|
|
\ ( -- )
|
|
|
|
\ Round up 'here' to nearlest multiple to CELL
|
|
|
|
: align here @ aligned here ! ;
|
|
|
|
|
|
|
|
\ === Stack Manipulation ===
|
|
|
|
|
|
|
|
: drop sp@ cell+ sp! ; \ ( w -- )
|
|
|
|
: dup sp@ @ ; \ ( w -- w w )
|
|
|
|
|
|
|
|
: >r rp@ rp@ @ rp@ cell - dup rp! ! ! ; \ ( w -- R:w )
|
|
|
|
: r> rp@ cell + @ rp@ @ rp@ cell + dup rp! ! ; \ ( R:w -- w)
|
|
|
|
|
|
|
|
: swap sp@ cell + dup @ >r ! r> ; \ ( a b -- b a )
|
|
|
|
: rot >r swap r> swap ; \ ( a b c -- b c a )
|
|
|
|
: -rot swap >r swap r> ; \ ( a b c -- c a b )
|
|
|
|
: nip swap drop ; \ ( a b -- a )
|
|
|
|
: over >r dup r> swap ; \ ( a b -- a b a )
|
|
|
|
: tuck dup -rot ; \ ( a b -- b a b )
|
|
|
|
: pick cells sp@ swap + cell + @ ; \ ( wu ... x0 u -- xu ... x0 xu )
|
|
|
|
|
|
|
|
: 2drop drop drop ; \ ( a b -- )
|
|
|
|
: 2dup over over ; \ ( a b -- a b a b )
|
|
|
|
: 2swap >r -rot r> -rot ; \ ( a b c d -- c d a b )
|
|
|
|
: 2nip 2swap 2drop ; \ ( a b c d -- c d )
|
|
|
|
: 2over 3 pick 3 pick ; \ ( a b c d -- a b c d a b )
|
|
|
|
: 2tuck 2swap 2over ; \ ( a b c d -- c d a b c d )
|
|
|
|
: 2rot >r >r 2swap r> r> 2swap ; \ ( a b c d e f -- c d e f a b )
|
|
|
|
: -2rot 2swap >r >r 2swap r> r> ; \ ( a b c d e f -- e f a b c d )
|
|
|
|
|
|
|
|
: rdrop r> rp@ ! ; \ ( R:w -- )
|
|
|
|
|
|
|
|
\ ( -- a-addr )
|
|
|
|
\ The bottom address of stacks.
|
|
|
|
\ sp@ and rp@ points bottom if implementation so far is correct.
|
2021-01-01 10:54:42 +01:00
|
|
|
: sp0 [ sp@ ] literal ;
|
|
|
|
: rp0 [ rp@ ] literal ;
|
2021-01-01 10:37:41 +01:00
|
|
|
|
|
|
|
\ === Integer Arithmetic ===
|
|
|
|
|
|
|
|
: 1+ 1 + ;
|
|
|
|
: 1- 1 - ;
|
|
|
|
|
2021-01-01 12:01:29 +01:00
|
|
|
\ ( a b -- (a mod b) (a / b) )
|
|
|
|
: /mod 2dup mod -rot / ;
|
2021-01-01 10:37:41 +01:00
|
|
|
|
|
|
|
\ ( n -- -n )
|
2021-01-01 12:01:29 +01:00
|
|
|
: negate 0 swap - ;
|
|
|
|
|
|
|
|
\ ( n1 -- n2 )
|
|
|
|
: not false = ;
|
|
|
|
|
|
|
|
: > swap < ;
|
|
|
|
: <= > not ;
|
|
|
|
: >= < not ;
|
|
|
|
: <> = not ;
|
|
|
|
|
|
|
|
: 0= 0 = ;
|
|
|
|
: 0<> 0 <> ;
|
|
|
|
: 0< 0 < ;
|
|
|
|
: 0> 0 > ;
|
|
|
|
: 0<= 0 <= ;
|
|
|
|
: 0>= 0 >= ;
|
|
|
|
|
|
|
|
\ ( a b c -- (a<=c & c<b) )
|
|
|
|
: within tuck > -rot <= and ;
|
|
|
|
|
|
|
|
\ === Conditional Branch ===
|
|
|
|
\ <condition> if <if-true> then
|
|
|
|
\ <condition> if <if-true> else <if-false> then
|
|
|
|
\ <condition> unless <if-false> then
|
|
|
|
\ <condition> unless <if-false> else <if-true> then
|
|
|
|
|
|
|
|
\ compile: ( -- orig )
|
|
|
|
\ runtime: ( n -- )
|
|
|
|
: if
|
|
|
|
compile 0branch
|
|
|
|
here @ 0 , \ save location of offset, fill dummy
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ compile: ( orig -- )
|
|
|
|
\ runtime: ( -- )
|
|
|
|
: then
|
|
|
|
here @ \ ( orig dest )
|
|
|
|
over - \ ( orig offset )
|
|
|
|
swap ! \ fill offset to orig
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ compile: ( orig1 -- orig2 )
|
|
|
|
\ runtime: ( -- )
|
|
|
|
: else
|
|
|
|
compile branch
|
|
|
|
here @ 0 , \ save location of offset, fill dummy
|
|
|
|
swap
|
|
|
|
\ fill offset, here-orig1, to orig1
|
|
|
|
here @
|
|
|
|
over -
|
|
|
|
swap !
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ compile: ( -- orig )
|
|
|
|
\ runtime: ( n -- )
|
|
|
|
: unless
|
|
|
|
compile not
|
|
|
|
[compile] if
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ === Loops ===
|
|
|
|
\ begin <body> <condition> until
|
|
|
|
\ begin <body> again
|
|
|
|
\ begin <condition> while <body> repeat
|
|
|
|
|
|
|
|
\ compile: ( -- dest )
|
|
|
|
\ runtime: ( -- )
|
|
|
|
: begin
|
|
|
|
here @ \ save location
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ compile: ( dest -- )
|
|
|
|
\ runtime: ( n -- )
|
|
|
|
: until
|
|
|
|
compile 0branch
|
|
|
|
here @ - , \ fill offset
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ compile: ( dest -- )
|
|
|
|
\ runtime: ( -- )
|
|
|
|
: again
|
|
|
|
compile branch
|
|
|
|
here @ - , \ fill offset
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ compile: ( dest -- dest orig )
|
|
|
|
\ runtime: ( n -- )
|
|
|
|
\ dest=location of begin
|
|
|
|
\ orig=location of while
|
|
|
|
: while
|
|
|
|
compile 0branch
|
|
|
|
here @ 0 , \ save location, fill dummy
|
|
|
|
; immediate
|
|
|
|
|
|
|
|
\ compile: ( dest orig -- )
|
|
|
|
\ runtime: ( -- )
|
|
|
|
\ dest=location of begin
|
|
|
|
\ orig=location of while
|
|
|
|
: repeat
|
|
|
|
swap
|
|
|
|
compile branch
|
|
|
|
here @ - , \ fill offset from here to begin
|
|
|
|
here @ over - swap ! \ backfill offset from while to here
|
|
|
|
; immediate
|
|
|
|
|
2021-01-01 12:11:47 +01:00
|
|
|
\ === Recursive Call ===
|
2021-01-01 10:37:41 +01:00
|
|
|
|
2021-01-01 12:18:45 +01:00
|
|
|
\ recursive call.
|
|
|
|
\ compiles xt of current definition
|
2021-01-01 12:11:47 +01:00
|
|
|
: recurse
|
|
|
|
latest @ >cfa ,
|
|
|
|
; immediate
|
2021-01-01 10:37:41 +01:00
|
|
|
|
2021-01-01 12:35:09 +01:00
|
|
|
\ === Multiline Comment ===
|
|
|
|
|
|
|
|
: '(' [ key ( ] literal ;
|
|
|
|
: ')' [ key ) ] literal ;
|
|
|
|
|
|
|
|
: (
|
|
|
|
1 \ depth counter
|
|
|
|
begin
|
|
|
|
key
|
|
|
|
dup '(' = if
|
|
|
|
drop 1+ \ increase depth
|
|
|
|
else
|
|
|
|
')' = if
|
|
|
|
1- \ decrease depth
|
|
|
|
then
|
|
|
|
then
|
|
|
|
dup 0= until
|
|
|
|
drop
|
|
|
|
; immediate
|
2021-01-01 12:18:45 +01:00
|
|
|
|
2021-01-01 12:35:09 +01:00
|
|
|
(
|
|
|
|
Now we can use multiline comment with ( nests. )
|
|
|
|
)
|
2021-01-01 12:18:45 +01:00
|
|
|
|
2020-12-31 15:47:37 +01:00
|
|
|
bye
|