-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathbr-subleq.s
executable file
·443 lines (386 loc) · 12.9 KB
/
br-subleq.s
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
; BeamRacer SUBLEQ Virtual Machine
;
; Maciej 'YTM/Elysium' Witkowiak, 2021
;
NTSC_LAST_SAFE_LINE = 259
NTSC_LINE_COUNT = 263
PAL_LAST_SAFE_LINE = 307
.include "vlib/vasyl.s"
sei
lda #<irq_handler
sta $314
lda #>irq_handler
sta $315
cli
jsr knock_knock
jsr copy_and_activate_dlist
@keyloop:
jsr $ffe4 ; check if key pressed
beq @keyloop
; stop VASYL and restore IRQ vector
lda #0
sta $d031
sei
lda #$31
sta $314
lda #$ea
sta $315
cli
rts
irq_handler:
lda $d019
and #%00010000
beq not_vasyl_irq
sta $d019 ; ack VASYL IRQ
lda VREG_PORT0 ; get the character to print
inc VREG_DLISTL ; release VASYL from spinlock, as it is ok to run concurrently from now on
jsr $FFD2 ; CHROUT
jmp $ea81 ; pull regs from the stack and RTI
not_vasyl_irq:
jmp $ea31 ; original IRQ routine
; Once VASYL enters a spinlock, only 6510 can stop it from spinning by
; incrementing VREG_DLISTL by one. Otherwise it will spin for an arbitrary amount of time
; (including across multiple frames).
.macro SPINLOCK
MOV VREG_DLISTL, <spinlock ; potential race, so do not use just before frame's end
MOV VREG_DLISTH, >spinlock
MOV $d021, 2
.if (* - dl_start) & $ff = $ff ; if spinlock would fall on a page's last byte
VNOP ; we insert a dummy NOP to prevent that.
.endif
spinlock:
MOV VREG_DLSTROBE, $a7 ; spin, baby, spin ; $a7 is VNOP, which we get pointed to
; once DLISTL is incremented
SKIP
WAIT NTSC_LAST_SAFE_LINE, 0
BRA safe_to_update ; we are still before NTSC's last safe line, and so also before PAL's.
WAIT NTSC_LINE_COUNT, 0 ; this only completes on PAL, so an NTSC machine will restart (at spinlock+1)
SKIP
WAIT PAL_LAST_SAFE_LINE, 0
BRA safe_to_update ; we're on PAL and still before last safe line.
END ; wait for the next frame
safe_to_update:
MOV VREG_DLISTL, <dl_restart
MOV VREG_DLISTH, >dl_restart
.endmacro
.include "vlib/vlib.s"
.segment "VASYL"
;; instruction action:
;; [b] <- [b]-[a] = -[a]+[b]; if b<=0 then goto 0
;; instruction encoding:
;; (address to jump to when result negative or zero - c) (address to jump to when result positive) (address of a) (address of b (result))
dl_start:
; enable reading from both ports, we're in bank0, DL enabled
MOV VREG_CONTROL, %00011000 ; this can be done from C64 setup
; start of vm program
MOV VREG_ADR0, <vm_start ; this can be done from C64 setup
MOV VREG_ADR0+1, >vm_start
; make DL restart at dl_restart so that program continues in the new frame
MOV VREG_DLISTL, <dl_restart
MOV VREG_DLISTH, >dl_restart
MOV VREG_DLIST2L, <mainloop
MOV VREG_DLIST2H, >mainloop
MOV $d01a, %00010000 ; enable VASYL interrupts
WAIT 300, 0 ; this WAIT can only complete on PAL - subsequent instructions won't be executed on an NTSC machine.
MOV VREG_ADR1, <(frame_end+1)
MOV VREG_ADR1+1, >(frame_end+1)
MOV VREG_PORT1, <PAL_LAST_SAFE_LINE ; default frame-end marker suitable for PAL
END
character_out:
MOV $d021, 7
IRQ
MOV VREG_ADR0, $ff
MOV VREG_ADR0+1, $ff
SPINLOCK
MOV $d021,6
BRA char_out_done
; comparator checks if both lo- and hi-byte are equal to $ff.
comparator:
comparator_addr:
MOV VREG_STEP0, 0 ; low byte
MOV VREG_ADR0, <(iocheck_table+$80)
MOV VREG_ADR0+1, >(iocheck_table+$80)
MOV VREG_ADR1, <(comparator_addr2+1)
MOV VREG_ADR1+1, >(comparator_addr2+1)
XFER VREG_STEP1, (0)
XFER VREG_PORT1, (0)
VNOP ; one waitcycle needed for the write above to land
comparator_addr2:
SETA 0 ; this will be modified
DECA
BRA back_from_comparator
comparator_addr3:
MOV VREG_STEP0, 0 ; hi byte
MOV VREG_ADR0, <(iocheck_table+$80)
MOV VREG_ADR0+1, >(iocheck_table+$80)
MOV VREG_ADR1, <(comparator_addr4+1)
MOV VREG_ADR1+1, >(comparator_addr4+1)
XFER VREG_STEP1, (0)
XFER VREG_PORT1, (0)
VNOP ; one waitcycle needed for the write above to land
comparator_addr4:
SETA 0 ; this will be modified
DECA
char_out_done:
BRA back_from_comparator
BRA character_out
comparator_trampoline:
BRA comparator
dl_restart: ;; new frame starts here
MOV $20, 2 ;; indicator start
mainloop: ;; new instruction processing starts here
MOV VREG_STEP0, 1
MOV VREG_STEP1, 2 ;; skip 2 bytes - over next opcode for all self-modifying writes
MOV VREG_ADR1, <(pcleq+1)
MOV VREG_ADR1+1, >(pcleq+1)
XFER VREG_PORT1, (0) ;; lo byte of new PC (if neq), branch after DECA taken
XFER VREG_PORT1, (0) ;; hi byte of new PC (if neq), branch after DECA taken
MOV VREG_ADR1, <(pcpos+1)
MOV VREG_ADR1+1, >(pcpos+1)
XFER VREG_PORT1, (0) ;; lo byte of new PC (if positive), branch after DECA not taken, just address of the next instruction
XFER VREG_PORT1, (0) ;; hi byte of new PC (if positive), branch after DECA not taken, just address of the next instruction
;; copy address of [a] into place where [a] will be read
MOV VREG_ADR1, <(addr1+1)
MOV VREG_ADR1+1, >(addr1+1)
XFER VREG_PORT1, (0) ;; lo byte of [a]
XFER VREG_PORT1, (0) ;; hi byte of [a]
;; copy address of [b] into three places: to read value to be negated and to store result of [b]-[a]
MOV VREG_STEP0, 0
MOV VREG_STEP1, 0
MOV VREG_ADR1, <(addr2+1)
MOV VREG_ADR1+1, >(addr2+1)
XFER VREG_PORT1, (0) ;; lo byte of [b]
MOV VREG_ADR1, <(addr2_2+1)
MOV VREG_ADR1+1, >(addr2_2+1)
XFER VREG_PORT1, (0) ;; lo byte of [b]
MOV VREG_ADR1, <(comparator_addr+1)
MOV VREG_ADR1+1, >(comparator_addr+1)
MOV VREG_STEP0, 1 ; advance after next read
XFER VREG_PORT1, (0) ;; lo byte of [b]
MOV VREG_STEP0, 0
MOV VREG_ADR1, <(addr2+1+2)
MOV VREG_ADR1+1, >(addr2+1+2)
XFER VREG_PORT1, (0) ;; hi byte of [b]
MOV VREG_ADR1, <(addr2_2+1+2)
MOV VREG_ADR1+1, >(addr2_2+1+2)
XFER VREG_PORT1, (0) ;; hi byte of [b]
MOV VREG_ADR1, <(comparator_addr3 + 1)
MOV VREG_ADR1+1, >(comparator_addr3 + 1)
XFER VREG_PORT1, (0) ;; hi byte of [b]
;; read value from [a], put as step 0 to be negated
addr1:
MOV VREG_ADR0, 0 ; this will be modified
MOV VREG_ADR0+1, 0 ; this will be modified
MOV VREG_ADR1, <(addrval_a+1)
MOV VREG_ADR1+1, >(addrval_a+1)
XFER VREG_PORT1, (0)
;; put value from [a] in $ffff for possible use by the 6510
MOV VREG_ADR1, $ff
MOV VREG_ADR1+1, $ff
XFER VREG_PORT1, (0)
BRA comparator_trampoline
back_from_comparator:
MOV VREG_STEP0, 0
MOV VREG_STEP1, 0
addr2:
;; read value from [b], put as step 0 into add/sign table offsets
;; (step0,1 must be still set to 0, we read the value twice)
MOV VREG_ADR0, 0 ; this will be modified
MOV VREG_ADR0+1, 0 ; this will be modified
MOV VREG_ADR1, <(addrval_b+1)
MOV VREG_ADR1+1, >(addrval_b+1)
XFER VREG_PORT1, (0)
MOV VREG_ADR1, <(addrval_b2+1)
MOV VREG_ADR1+1, >(addrval_b2+1)
XFER VREG_PORT1, (0)
;; first indexed read - what is -[a]? put it into addrval_aneg2 and addrval_aneg as step0 values
MOV VREG_ADR0, <(negtable+$80) ; middle of the table, position of 0
MOV VREG_ADR0+1, >(negtable+$80) ; middle of the table, position of 0
MOV VREG_ADR1, <(addrval_aneg+1)
MOV VREG_ADR1+1, >(addrval_aneg+1)
addrval_a:
MOV VREG_STEP0, 0 ; this will be set to value from [a]
XFER VREG_PORT1, (0) ; read once and advance port0 by [a], but step1 is still 0
MOV VREG_STEP0, 0 ; don't advance now, we need this value twice
XFER VREG_PORT1, (0) ; read -[a] and store at addrval_aneg
MOV VREG_ADR1, <(addrval_aneg2+1)
MOV VREG_ADR1+1, >(addrval_aneg2+1)
XFER VREG_PORT1, (0) ; read -[a] and store at addrval_aneg2
;; is [b]-[a]>0?
MOV VREG_STEP1, 0 ; PORT1 will be written thrice, we only want to know last value
MOV VREG_ADR0, <(signtable+$100) ; middle of the table, position of '0'
MOV VREG_ADR0+1, >(signtable+$100) ; middle of the table, position of '0'
MOV VREG_ADR1, <(setaval+1)
MOV VREG_ADR1+1, >(setaval+1)
addrval_aneg:
MOV VREG_STEP0, 0 ; step here will be -[a] value (-128,127)
XFER VREG_PORT1, (0) ; read value at 0, move from 0 to -[a] value
addrval_b:
MOV VREG_STEP0, 0 ; step here will be [b] value (-128,127)
XFER VREG_PORT1, (0) ; read value at -[a], move from -[a] to [b] value
XFER VREG_PORT1, (0) ; finally read sign of subtraction result - 0 to skip BRA or <>0 to run BRA
;; what is the actual value [b]-[a]?
MOV VREG_STEP1, 0 ; PORT1 will be written thrice, we only want to know last value
MOV VREG_ADR0, <(addtable+$100) ; middle of the table, position of '0'
MOV VREG_ADR0+1, >(addtable+$100) ; middle of the table, position of '0'
addr2_2:
;; store result in b
MOV VREG_ADR1, 0 ; this will be modified
MOV VREG_ADR1+1, 0 ; this will be modified
addrval_aneg2:
MOV VREG_STEP0, 0 ; step here will be -[a] value (-128,127)
XFER VREG_PORT1, (0) ; read value at 0, move from 0 to -[a] value
addrval_b2:
MOV VREG_STEP0, 0 ; step here will be [b] value (-128,127)
XFER VREG_PORT1, (0) ; read value at -[a], move from -[a] to [b] value
XFER VREG_PORT1, (0) ; finally read subtraction result, store at addr2
setaval:
SETA 0 ; this will be modified
DECA ; if A==0 branch will not be taken, when [a]>[b]
BRA pcleq ; branch if A<>0
pcpos:
MOV VREG_ADR0, 0 ; branch not taken, take next instruction
MOV VREG_ADR0+1, 0
BRA pcrun
pcleq:
MOV VREG_ADR0, 0 ; branch taken
MOV VREG_ADR0+1, 0
pcrun:
d020_val:
MOV $20, 6 ; debug indicator
SKIP
frame_end:
WAIT NTSC_LAST_SAFE_LINE,0 ; default frame-end marker suitable for NTSC
MOV VREG_DL2STROBE, 0
MOV $20, 15 ; we have no time for processing next instruction, end this DL run
END
signtable:
; table with sign information, (1=negative or 0, 0=positive)
; note: first/last 128 bytes indicate +/- overflow, in add table they are (respectively) positive/negative, should this be consistent with information here as well?
.repeat 256 ; negative numbers
.byte 1
.endrepeat
.byte 1 ; zero
.repeat 255 ; positive numbers
.byte 0
.endrepeat
addtable:
; table for adding numbers, index by offset from the middle
.repeat 256, I
.byte I
.endrepeat
.repeat 256, I
.byte I
.endrepeat
negtable:
; table for negating numbers, index by offset from the middle
.repeat 128, I
.byte 128-I
.endrepeat
.repeat 128, I
.byte <(-I)
.endrepeat
iocheck_table:
.repeat 127
.byte 1
.endrep
.byte 0
.repeat 128
.byte 1
.endrep
; subleq program encoding
; <negative-jmp> <positive-jmp> <a> <b>; [b]<-[b]-[a]; if [b]-[a]<=0 then [negative-jmp] else [positive-jmp]
.macro subleq addr_a, addr_b, jump_c
.ifblank addr_a
.error "SUBLEQ: first argument required for subleq macro"
.endif
.ifnblank jump_c
.word jump_c ; where to jump if negative
.else
.word :+ ; if ommited then point to the next instruction
.endif
.word :+ ; link to next instruction (required for VASYL, not existing in pure Subleq)
.word addr_a ; [a]
.ifnblank addr_b
.word (addr_b & $ffff) ; [b], [b]<-[b]-[a] ;; "& $ffff" enables negative values
.else
.word addr_a ; if 2nd argument is omitted reuse [a]
.endif
:
.endmacro
vm_start:
; subleq program starts here, addresses must be absolute, not relative to vm_start
; debug cases for jumps:
; subleq three, seven, sloop ; 7-3=4 4>=0 so no jump to sloop, infinite loop with no visuals
; subleq seven, three, sloop ; 3-7=-4 4<0 so jump to sloop, infinite loop with visuals
; subleq seven, seven, sloop ; 7-7=0, 0=0 so jump to sloop, infinite loop with visuals
;: subleq zero, zero, :- ; infinite loop with no visuals
; debug cases for arithmetics
subleq three, seven ; 7-3=4, seven=4
subleq two, isseven ; 0-2=-2, isseven=-2
subleq isseven, five ; 5-(-2)=5+2=7, five=7
subleq isseven ; zero-out location isseven
subleq negone, three ; 3-(-1)=4, three=4
; Following code only works by lucky coincidence - just the lo-bytes of ptrs need to be adjusted.
; We need 16-bit arithmetics!
print_hello:
subleq char_counter
terminator_check:
subleq zero, hello_txt, ploop
printer:
subleq hello_txt, -1
subleq negone, terminator_check+6
subleq negone, printer+4
subleq negone, char_counter
subleq zero, zero, terminator_check
ploop:
; restore start pointer
subleq char_counter, terminator_check+6
subleq char_counter, printer+4
subleq one, d020_val+1 ; visual feedback
subleq zero, zero, print_hello ; jmp to beginning
sloop: ; infinite loop that changes border color by modifying display list directly
.word sloop, sloop, one, d020_val+1
subleq zero, zero, sloop ; infinite loop
: .word :-, :-, zero, zero ; this is also infinite loop
; subleq data space - memory, constants, registers, variables
zero: .byte 0 ; literal 0
seven: .byte 7
three: .byte 3
one: .byte 1
two: .byte 2
five: .byte 5
isseven: .byte 0
negone: .byte $ff
hello_txt: .byte "vasyl says hello!", $0d, 0
char_counter: .byte 0
; all the exports for debug purposes
; vpeek(seven) should be 4
; vpeek(isseven) should be 0
; vpeek(five) sohuld be 7
.export signtable
.export addtable
.export negtable
.export vm_start
.export zero
.export seven
.export three
.export two
.export five
.export isseven
.export dl_start
.export dl_restart
.export mainloop
.export pcleq
.export pcpos
.export addr1
.export addr2
.export addr2_2
.export addrval_a
.export addrval_aneg
.export addrval_aneg2
.export addrval_b
.export addrval_b2
.export setaval
.export d020_val
.export iocheck_table