# Sizes, counted in Int64 cells, of the VM memory and the fixed regions inside it.
size_mem = 1_000_000  # whole VM memory (1 mega-int)
size_RS  = 1_000      # return stack
size_PS  = 1_000      # parameter stack
size_TIB = 1_000      # terminal input buffer
11 # The mem array constitutes the memory of the VM. It has the following geography:
# mem = +-----------------------+
#       | Built-in Variables    |
#       +-----------------------+
#       | Return Stack          |
#       +-----------------------+
#       | Parameter Stack       |
#       +-----------------------+
#       | Terminal Input Buffer |
#       +-----------------------+
#       | Dictionary            |
#       +-----------------------+
# Note that all words (user-defined, primitive, variables, etc.) are included in
# the dictionary.
28 # Simple linear addressing is used with one exception: references to primitive code
# blocks, which are represented as anonymous functions, appear as negative indices
30 # into the primitives array which contains these functions.
# VM memory (left uninitialised), the table of primitive code blocks, and the
# table of names recorded for those primitives.
mem = Vector{Int64}(size_mem)
primitives = Function[]
primNames = ASCIIString[]
# Reserve four consecutive cells, starting at nextVarAddr, for the built-in
# variables, then advance nextVarAddr past them.
RSP0 = nextVarAddr
PSP0 = RSP0 + 1
HERE = PSP0 + 1
LATEST = HERE + 1
nextVarAddr = LATEST + 1

# Lay the fixed regions out back to back, directly after the built-in variables.
mem[RSP0] = nextVarAddr            # bottom of RS
mem[PSP0] = nextVarAddr + size_RS  # bottom of PS
TIB = mem[PSP0] + size_PS          # address of terminal input buffer
mem[HERE] = TIB + size_TIB         # location of bottom of dictionary
mem[LATEST] = 0                    # no previous definition

# Keep the bottom of the dictionary as a constant; mem[HERE] moves as words are added.
DICT = mem[HERE]
54 RSP::Int64 # Return stack pointer
55 PSP::Int64 # Parameter/data stack pointer
56 IP::Int64 # Instruction pointer
57 W::Int64 # Working register
59 reg = Reg(mem[RSP0], mem[PSP0], 0, 0)
61 # Stack manipulation functions
# Exception thrown when the parameter stack is shallower than an operation needs.
type ParamStackUnderflow <: Exception
end

# Exception thrown when the return stack is shallower than an operation needs.
type ReturnStackUnderflow <: Exception
end

# Human-readable messages for the two underflow conditions.
function Base.showerror(io::IO, ex::ParamStackUnderflow)
    print(io, "Parameter stack underflow.")
end

function Base.showerror(io::IO, ex::ReturnStackUnderflow)
    print(io, "Return stack underflow.")
end
# Number of cells currently on the return stack: distance of RSP from the stack base.
function getRSDepth()
    return reg.RSP - mem[RSP0]
end

# Number of cells currently on the parameter stack: distance of PSP from the stack base.
function getPSDepth()
    return reg.PSP - mem[PSP0]
end
72 function ensurePSDepth(depth::Int64)
74 throw(ParamStackUnderflow())
78 function ensureRSDepth(depth::Int64)
80 throw(ReturnStackUnderflow())
84 function pushRS(val::Int64)
96 function pushPS(val::Int64)
97 mem[reg.PSP += 1] = val
108 # Handy functions for adding/retrieving strings to/from memory.
# Read `len` consecutive cells of VM memory starting at `addr` and return them
# as an ASCIIString, one character per cell.
function getString(addr::Int64, len::Int64)
    cells = mem[addr:(addr+len-1)]
    return ASCIIString([Char(cell) for cell in cells])
end
111 function putString(str::ASCIIString, addr::Int64)
112 mem[addr:(addr+length(str)-1)] = [Int64(c) for c in str]
115 # Primitive creation and calling functions
117 function defPrim(f::Function; name="nameless")
119 push!(primNames, replace(replace(name, "\004", "EOF"), "\n", "\\n"))
121 return -length(primitives)
# Invoke the primitive referenced by `addr`. Primitive references are negative
# indices into `primitives`, so the sign is flipped before the lookup.
function callPrim(addr::Int64)
    prim = primitives[-addr]
    return prim()
end
126 # Word creation functions
128 function createHeader(name::AbstractString, flags::Int64)
129 mem[mem[HERE]] = mem[LATEST]
130 mem[LATEST] = mem[HERE]
133 mem[mem[HERE]] = length(name) | flags; mem[HERE] += 1
134 putString(name, mem[HERE]); mem[HERE] += length(name)
137 function defPrimWord(name::AbstractString, f::Function; flags::Int64=0)
138 createHeader(name, flags)
140 codeWordAddr = mem[HERE]
141 mem[codeWordAddr] = defPrim(f, name=name)
147 function defWord(name::AbstractString, wordAddrs::Array{Int64,1}; flags::Int64=0)
148 createHeader(name, flags)
151 mem[mem[HERE]] = DOCOL
154 for wordAddr in wordAddrs
155 mem[mem[HERE]] = wordAddr
162 # Variable creation functions
164 function defExistingVar(name::AbstractString, varAddr::Int64; flags::Int64=0)
166 defPrimWord(name, eval(:(() -> begin
172 function defNewVar(name::AbstractString, initial::Int64; flags::Int64=0)
173 createHeader(name, flags)
175 codeWordAddr = mem[HERE]
176 varAddr = mem[HERE] + 1
178 mem[mem[HERE]] = DOVAR; mem[HERE] += 1
179 mem[mem[HERE]] = initial; mem[HERE] += 1
181 return varAddr, codeWordAddr
184 function defConst(name::AbstractString, val::Int64; flags::Int64=0)
185 createHeader(name, flags)
187 mem[mem[HERE]] = DOCON; mem[HERE] += 1
188 mem[mem[HERE]] = val; mem[HERE] += 1
193 # Threading Primitives (inner interpreter)
195 NEXT = defPrim(() -> begin
201 DOCOL = defPrim(() -> begin
207 DOVAR = defPrim(() -> begin
212 DOCON = defPrim(() -> begin
213 pushPS(mem[reg.W + 1])
217 EXIT = defPrimWord("EXIT", () -> begin
222 # Dictionary entries for core built-in variables, constants
# Expose the built-in variables as dictionary words, keeping each returned value.
HERE_CFA   = defExistingVar("HERE", HERE)
LATEST_CFA = defExistingVar("LATEST", LATEST)
PSP0_CFA   = defExistingVar("PSP0", PSP0)
RSP0_CFA   = defExistingVar("RSP0", RSP0)

# Constants whose return values are not needed on the Julia side. They are
# defined in the listed order.
for (constName, constVal) in (("DOCOL", DOCOL),
                              ("DOCON", DOCON),
                              ("DOVAR", DOVAR),
                              ("DICT", DICT),
                              ("MEMSIZE", size_mem))
    defConst(constName, constVal)
end

# Flag bits and length mask applied to the length/flags cell of a word header.
F_IMMED   = defConst("F_IMMED", 128)
F_HIDDEN  = defConst("F_HIDDEN", 256)
F_LENMASK = defConst("F_LENMASK", 127)
240 # Basic forth primitives
242 DROP = defPrimWord("DROP", () -> begin
247 SWAP = defPrimWord("SWAP", () -> begin
255 DUP = defPrimWord("DUP", () -> begin
261 OVER = defPrimWord("OVER", () -> begin
263 pushPS(mem[reg.PSP-1])
267 ROT = defPrimWord("ROT", () -> begin
277 NROT = defPrimWord("-ROT", () -> begin
288 TWODROP = defPrimWord("2DROP", () -> begin
294 TWODUP = defPrimWord("2DUP", () -> begin
303 TWOSWAP = defPrimWord("2SWAP", () -> begin
315 TWOOVER = defPrimWord("2OVER", () -> begin
324 QDUP = defPrimWord("?DUP", () -> begin
333 INCR = defPrimWord("1+", () -> begin
339 DECR = defPrimWord("1-", () -> begin
345 INCR2 = defPrimWord("2+", () -> begin
351 DECR2 = defPrimWord("2-", () -> begin
357 ADD = defPrimWord("+", () -> begin
364 SUB = defPrimWord("-", () -> begin
371 MUL = defPrimWord("*", () -> begin
378 DIVMOD = defPrimWord("/MOD", () -> begin
387 TWOMUL = defPrimWord("2*", () -> begin
392 TWODIV = defPrimWord("2/", () -> begin
397 EQU = defPrimWord("=", () -> begin
400 pushPS(a==b ? -1 : 0)
404 NEQU = defPrimWord("<>", () -> begin
407 pushPS(a!=b ? -1 : 0)
411 LT = defPrimWord("<", () -> begin
418 GT = defPrimWord(">", () -> begin
425 LE = defPrimWord("<=", () -> begin
428 pushPS(a<=b ? -1 : 0)
432 GE = defPrimWord(">=", () -> begin
435 pushPS(a>=b ? -1 : 0)
439 ZEQU = defPrimWord("0=", () -> begin
440 pushPS(popPS() == 0 ? -1 : 0)
444 ZNEQU = defPrimWord("0<>", () -> begin
445 pushPS(popPS() != 0 ? -1 : 0)
449 ZLT = defPrimWord("0<", () -> begin
450 pushPS(popPS() < 0 ? -1 : 0)
454 ZGT = defPrimWord("0>", () -> begin
455 pushPS(popPS() > 0 ? -1 : 0)
459 ZLE = defPrimWord("0<=", () -> begin
460 pushPS(popPS() <= 0 ? -1 : 0)
464 ZGE = defPrimWord("0>=", () -> begin
465 pushPS(popPS() >= 0 ? -1 : 0)
469 AND = defPrimWord("AND", () -> begin
476 OR = defPrimWord("OR", () -> begin
483 XOR = defPrimWord("XOR", () -> begin
490 INVERT = defPrimWord("INVERT", () -> begin
497 LIT = defPrimWord("LIT", () -> begin
505 STORE = defPrimWord("!", () -> begin
512 FETCH = defPrimWord("@", () -> begin
518 ADDSTORE = defPrimWord("+!", () -> begin
525 SUBSTORE = defPrimWord("-!", () -> begin
535 TOR = defPrimWord(">R", () -> begin
540 FROMR = defPrimWord("R>", () -> begin
545 RFETCH = defPrimWord("R@", () -> begin
550 RSPFETCH = defPrimWord("RSP@", () -> begin
555 RSPSTORE = defPrimWord("RSP!", () -> begin
560 RDROP = defPrimWord("RDROP", () -> begin
567 PSPFETCH = defPrimWord("PSP@", () -> begin
572 PSPSTORE = defPrimWord("PSP!", () -> begin
579 WFETCH = defPrimWord("W@", () -> begin
584 WSTORE = defPrimWord("W!", () -> begin
# Stack of input sources; the most recently pushed one is the one being read.
sources = Any[]

# Return the input source on top of the `sources` stack.
function currentSource()
    return sources[end]
end
595 NUMTIB, NUMTIB_CFA = defNewVar("#TIB", 0)
596 TOIN, TOIN_CFA = defNewVar(">IN", 0)
597 EOF = defConst("EOF", 4)
599 KEY = defPrimWord("KEY", () -> begin
600 if mem[TOIN] >= mem[NUMTIB]
603 if !eof(currentSource())
604 line = readline(currentSource())
605 mem[NUMTIB] = length(line)
613 pushPS(mem[TIB + mem[TOIN]])
619 EMIT = defPrimWord("EMIT", () -> begin
624 WORD = defPrimWord("WORD", () -> begin
641 if c == '\n' || c == eof_char
647 if c == ' ' || c == '\t'
657 if c == '\n' || c == eof_char
658 # Treat newline as a special word
660 mem[wordAddr + offset] = Int64(c)
667 mem[wordAddr + offset] = Int64(c)
673 if c == ' ' || c == '\t' || c == '\n' || c == eof_char
688 BASE, BASE_CFA = defNewVar("BASE", 10)
689 NUMBER = defPrimWord("NUMBER", () -> begin
694 s = getString(wordAddr, wordLen)
697 pushPS(parse(Int64, s, mem[BASE]))
700 pushPS(1) # Error indication
706 # Dictionary searches
708 FIND = defPrimWord("FIND", () -> begin
712 word = lowercase(getString(wordAddr, wordLen))
717 while (latest = mem[latest]) > 0
718 lenAndFlags = mem[latest+1]
719 len = lenAndFlags & F_LENMASK
720 hidden = (lenAndFlags & F_HIDDEN) == F_HIDDEN
722 if hidden || len != wordLen
727 thisWord = lowercase(getString(thisAddr, len))
729 if lowercase(thisWord) == lowercase(word)
739 TOCFA = defPrimWord(">CFA", () -> begin
742 lenAndFlags = mem[addr+1]
743 len = lenAndFlags & F_LENMASK
745 pushPS(addr + 2 + len)
750 TODFA = defWord(">DFA", [TOCFA, INCR, EXIT])
754 BRANCH = defPrimWord("BRANCH", () -> begin
755 reg.IP += mem[reg.IP]
759 ZBRANCH = defPrimWord("0BRANCH", () -> begin
761 reg.IP += mem[reg.IP]
771 STATE, STATE_CFA = defNewVar("STATE", 0)
773 HEADER = defPrimWord("HEADER", () -> begin
777 word = getString(wordAddr, wordLen)
779 createHeader(word, 0)
784 COMMA = defPrimWord(",", () -> begin
785 mem[mem[HERE]] = popPS()
791 LBRAC = defPrimWord("[", () -> begin
796 RBRAC = defPrimWord("]", () -> begin
801 HIDDEN = defPrimWord("HIDDEN", () -> begin
803 mem[addr] = mem[addr] $ F_HIDDEN
807 HIDE = defWord("HIDE",
817 LATEST_CFA, FETCH, HIDDEN,
821 SEMICOLON = defWord(";",
823 LATEST_CFA, FETCH, HIDDEN,
825 EXIT], flags=F_IMMED)
827 IMMEDIATE = defPrimWord("IMMEDIATE", () -> begin
828 lenAndFlagsAddr = mem[LATEST] + 1
829 mem[lenAndFlagsAddr] = mem[lenAndFlagsAddr] $ F_IMMED
834 [WORD, FIND, TOCFA, EXIT])
836 BTICK = defWord("[']",
837 [FROMR, DUP, INCR, TOR, FETCH, EXIT])
841 CREATE = defWord("CREATE",
844 LIT, DOVAR, COMMA, EXIT]);
846 DODOES = defPrim(() -> begin
852 defConst("DODOES", DODOES)
# (DOES>): store DODOES into the code field of the most recently defined word.
#
# DODOES is a raw primitive reference (defPrim returns a negative index), so it
# cannot sit in a word thread as if it were a word address. It is pushed with LIT,
# the same way CREATE pushes DOVAR. The latest header address is obtained through
# the LATEST_CFA word, matching its use in HIDE and ";".
FROMDOES_PAREN = defWord("(DOES>)",
    [LIT, DODOES, LATEST_CFA, FETCH, TOCFA, STORE, EXIT])
# DOES> (immediate): compile "(DOES>)" and "EXIT" into the definition being built,
# then compile LIT followed by the data field address of the latest word.
#
# LATEST is the raw memory address of the variable cell, not a word, so the thread
# must reference LATEST_CFA, as HIDE and ";" do. The thread also has to end with
# EXIT like every other defWord list in this file; without it execution would run
# past the end of this definition.
FROMDOES = defWord("DOES>",
    [BTICK, FROMDOES_PAREN, COMMA, BTICK, EXIT, COMMA,
    BTICK, LIT, COMMA, LATEST_CFA, FETCH, TODFA, COMMA, EXIT], flags=F_IMMED)
864 LITSTRING = defPrimWord("LITSTRING", () -> begin
874 TELL = defPrimWord("TELL", () -> begin
877 str = getString(addr, len)
884 EXECUTE = defPrimWord("EXECUTE", () -> begin
889 type ParseError <: Exception
890 wordName::ASCIIString
# Report a ParseError by naming the word that could not be interpreted.
function Base.showerror(io::IO, ex::ParseError)
    print(io, "Parse error at word: '$(ex.wordName)'.")
end
894 DEBUG, DEBUG_CFA = defNewVar("DEBUG", 0)
896 INTERPRET = defPrimWord("INTERPRET", () -> begin
900 wordName = getString(mem[reg.PSP-1], mem[reg.PSP])
902 println("... ", replace(replace(wordName, "\004", "EOF"), "\n", "\\n"), " ...")
905 callPrim(mem[TWODUP])
908 wordAddr = mem[reg.PSP]
913 isImmediate = (mem[wordAddr+1] & F_IMMED) != 0
916 callPrim(mem[NROT]) # get rid of extra copy of word string details
920 if mem[STATE] == 0 || isImmediate
922 return callPrim(mem[EXECUTE])
924 # Append CFA to dictionary
928 # Not in dictionary, assume number
932 callPrim(mem[NUMBER])
935 throw(ParseError(wordName))
939 # Number already on stack!
941 # Append literal to dictionary
951 QUIT = defWord("QUIT",
956 BYE = defPrimWord("BYE", () -> begin
960 PROMPT = defPrimWord("PROMPT", () -> begin
964 NL = defPrimWord("\n", () -> begin
965 if mem[STATE] == 0 && currentSource() == STDIN
966 callPrim(mem[PROMPT])
971 INCLUDE = defPrimWord("INCLUDE", () -> begin
975 word = getString(wordAddr, wordLen)
977 push!(sources, open(word, "r"))
985 EOF_WORD = defPrimWord("\x04", () -> begin
986 if currentSource() != STDIN
987 close(currentSource())
993 if currentSource() == STDIN
994 callPrim(mem[PROMPT])
1005 CHAR = defPrimWord("CHAR", () -> begin
1009 word = getString(wordAddr, wordLen)
1010 pushPS(Int64(word[1]))
1016 initFileName = nothing
1017 if isfile("lib.4th")
1018 initFileName = "lib.4th"
1019 elseif isfile(Pkg.dir("forth/src/lib.4th"))
1020 initFileName = Pkg.dir("forth/src/lib.4th")
1025 function run(;initialize=true)
1026 # Begin with STDIN as source
1027 push!(sources, STDIN)
1029 global initialized, initFileName
1030 if !initialized && initialize
1031 if initFileName != nothing
1032 print("Including definitions from $initFileName...")
1033 push!(sources, open(initFileName, "r"))
1036 println("No library file found. Only primitive words available.")
1040 # Start with IP pointing to first instruction of outer interpreter
1043 # Primitive processing loop.
# Everything else is simply a consequence of this loop!
1049 println("Evaluating prim ", jmp," ", primNames[-jmp])
1055 showerror(STDOUT, ex)
1058 while !isempty(sources) && currentSource() != STDIN
1059 close(pop!(sources))
1074 function dump(startAddr::Int64; count::Int64 = 100, cellsPerLine::Int64 = 10)
1075 chars = Array{Char,1}(cellsPerLine)
1077 lineStartAddr = cellsPerLine*div((startAddr-1),cellsPerLine) + 1
1078 endAddr = startAddr + count - 1
1080 q, r = divrem((endAddr-lineStartAddr+1), cellsPerLine)
1081 numLines = q + (r > 0 ? 1 : 0)
1087 for c in 1:cellsPerLine
1088 if i >= startAddr && i <= endAddr
1090 if mem[i]>=32 && mem[i]<128
1091 chars[c] = Char(mem[i])
1103 println("\t", ASCIIString(chars))
1108 count = reg.PSP - mem[PSP0]
1112 for i in (mem[PSP0]+1):reg.PSP
1117 println("Parameter stack empty")
1122 count = reg.RSP - mem[RSP0]
1126 for i in (mem[RSP0]+1):reg.RSP
1131 println("Return stack empty")
1135 DUMP = defPrimWord("DUMP", () -> begin
1139 dump(addr, count=count)