forked from kragen/stoneknifeforth
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtinyboot.py
executable file
·284 lines (226 loc) · 7.27 KB
/
tinyboot.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
#!/usr/bin/python
# -*- coding: utf-8 -*-
"""Tiny bootstrapping interpreter for the first bootstrap stage.
Implements an extremely minimal Forth-like language, used to write
tinyboot1.tbf1.
The theory is that first we ‘compile’ the program by reading through
it to find compile-time definitions and actions, which sets up the
initial state of memory; then we ‘run’ the program by directly
interpreting its text, given that initial state.
"""
import sys, cgitb
cgitb.enable(format='text')
def debug(text):
sys.stderr.write(text + "\n")
start_address = None
memory = [] # a list of bytes represented as integers
stack = []
rstack = []
### Compile-time actions.
# Note that these should leave program_counter pointing after the last
# byte they consume, i.e. they should eat_byte the last byte they
# consume.
program_counter = 0
def current_byte():
return program[program_counter]
def eat_byte():
global program_counter
current_byte = program[program_counter]
program_counter += 1
return current_byte
def advance_past_whitespace():
while program_counter < len(program) and current_byte() in ' \n':
eat_byte()
def advance_to_whitespace():
while program_counter < len(program) and current_byte() not in ' \n':
eat_byte()
def get_token():
advance_past_whitespace()
# XXX and on EOF?
rv = current_byte()
if rv not in "0123456789'": advance_to_whitespace()
return rv
def eat_comment():
comment_start = program_counter
while eat_byte() != ')': pass
jump_targets[comment_start] = program_counter
def push_dataspace_label(n):
return lambda: stack.append(n)
def define(name, action):
assert name not in run_time_dispatch, name
run_time_dispatch[name] = action
def dataspace_label():
"Define a label in data space."
name = get_token()
define(name, push_dataspace_label(len(memory)))
def call_function(n):
def rv():
global program_counter
rstack.append(program_counter)
program_counter = n
return rv
def define_function():
name = get_token()
define(name, call_function(program_counter))
def read_number():
start = program_counter
while eat_byte() in '0123456789': pass
return int(program[start:program_counter])
def literal_byte():
advance_past_whitespace()
memory.append(read_number())
def as_bytes(num):
"Convert a 32-byte number into a little-endian byte sequence."
return [num & 255, num >> 8 & 255, num >> 16 & 255, num >> 24 & 255]
def literal_word():
"Compile a little-endian literal 32-byte number into data space."
advance_past_whitespace()
memory.extend(as_bytes(read_number()))
def allocate_space():
advance_past_whitespace()
memory.extend([0] * read_number())
def set_start_address():
global start_address
start_address = program_counter
def nop(): pass
def skip_literal_byte():
eat_byte() # skip the '
eat_byte() # skip the character itself
# We have to find the backwards jump targets for loops while scanning
# forward. Otherwise we’d have to find them by scanning backwards,
# and you can’t correctly skip comments that way, since comments don’t
# nest.
jump_targets = {}
def start_conditional():
stack.append(program_counter)
def end_conditional():
jump_targets[stack.pop()] = program_counter
start_loop = start_conditional
def end_loop():
jump_targets[program_counter] = stack.pop()
compile_time_dispatch = {
'(': eat_comment,
'v': dataspace_label,
':': define_function,
'b': literal_byte,
'#': literal_word,
'*': allocate_space,
'^': set_start_address,
'[': start_conditional, ']': end_conditional,
'{': start_loop, '}': end_loop,
' ': eat_byte, '\n': eat_byte,
"'": skip_literal_byte,
}
for digit in '0123456789': compile_time_dispatch[digit] = read_number
def tbfcompile():
while program_counter < len(program):
token = get_token()
if token in compile_time_dispatch:
compile_time_dispatch[token]()
elif token in run_time_dispatch:
pass # ignore things from run-time for now
else:
excerpt_beginning = max(0, program_counter - 30)
assert False, '%r not defined at %r' % \
(token, program[excerpt_beginning:program_counter])
# To ensure the loop test condition hits the EOF instead of
# get_token() choking on it:
advance_past_whitespace()
### Run-time actions.
# Execution should pretty much stay inside of functions, and we
# shouldn't run into any compile-time actions there, right?
def write_out():
"Given an address and a count, write out some memory to stdout."
count = stack.pop()
address = stack.pop()
debug('writing address %d, count %d' % (address, count))
sys.stdout.write(''.join([chr(memory[ii])
for ii in range(address, address+count)]))
def quit():
sys.exit(0)
def subtract():
x = stack.pop()
stack.append((stack.pop() - x) & 0xFfffFfff)
def push_literal():
stack.append(read_number())
def decode(bytes):
rv = bytes[0] | bytes[1] << 8 | bytes[2] << 16 | bytes[3] << 24
if rv > 0x7fffFfff:
rv -= 0x100000000
return rv
def fetch():
addr = stack.pop()
stack.append(decode(memory[addr:addr+4]))
def extend_memory(addr):
# Addresses > 100k are probably just a bug; it’s not practical to
# run large programs with this interpreter anyway.
if len(memory) < addr + 1 and addr < 100000:
memory.extend([0] * (addr + 1 - len(memory)))
def store():
addr = stack.pop()
extend_memory(addr)
memory[addr:addr+4] = as_bytes(stack.pop())
def store_byte():
addr = stack.pop()
extend_memory(addr)
memory[addr] = stack.pop() & 255
def less_than():
b = stack.pop()
a = stack.pop()
if a < b:
stack.append(1)
else:
stack.append(0)
def return_from_function():
global program_counter
program_counter = rstack.pop()
def read_byte():
byte = sys.stdin.read(1)
if byte == '':
stack.append(-1)
else:
stack.append(ord(byte))
def jump():
global program_counter
program_counter = jump_targets[program_counter]
def conditional():
if stack.pop(): return
jump()
def loop():
if not stack.pop(): return
jump()
def literal_byte():
# you put 'A into your program to get 65, or 'B to get 66, etc.
eat_byte() # to skip the '
stack.append(ord(eat_byte()))
run_time_dispatch = {
'(': jump,
'W': write_out,
'G': read_byte,
'Q': quit,
'-': subtract,
'<': less_than,
'@': fetch,
'!': store,
# 'f': fetch_byte, not yet needed
's': store_byte,
';': return_from_function,
'[': conditional, ']': nop,
'{': nop, '}': loop,
' ': nop, '\n': nop,
"'": literal_byte,
}
for digit in '0123456789': run_time_dispatch[digit] = push_literal
def tbfrun():
assert start_address is not None
global program_counter
program_counter = start_address
while True:
run_time_dispatch[get_token()]()
def main(infile):
global program
program = infile.read()
tbfcompile()
tbfrun()
assert False, "tbfrun returned"
if __name__ == '__main__': main(file(sys.argv[1]))