-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathVGAXS.cpp
267 lines (255 loc) · 8.75 KB
/
VGAXS.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
#include "VGAXS.h"
//HSYNC pin used by TIMER2
#define HSYNCPIN 3
//These two pins cannot be changed without also modifying the HSYNC assembler code
#define COLORPIN0 6
#define COLORPIN1 7
//VSYNC pin used by TIMER1. Can be 9 or 10
#define VSYNCPIN 9
//Number of VGA lines to be skipped (black lines)
/*These lines include the vertical sync pulse and the back porch.
The minimum value must be 35 (calculated from Nick Gammon's sketch).
You can modify this value to center the framebuffer vertically, or not*/
#define SKIPLINES 45
//number of visible lines, after SKIPLINES
//NOTE(review): not referenced by the code visible in this file - confirm it is still needed
#define RENDERLCOUNT 359
//audio state: afreq is the countdown decremented by the HSYNC interrupt,
//afreq0 is the value afreq is reloaded with (0 selects the no_audio path)
static byte afreq, afreq0;
//incremented once per VSYNC interrupt
unsigned vtimer;
//aline counts the scanlines emitted for the current framebuffer row,
//rlinecnt is the index of the framebuffer row being rendered
static byte aline, rlinecnt;
//number of HSYNC interrupts still to be skipped before rendering starts
static byte vskip;
//framebuffer: VGAX_HEIGHT rows of VGAX_BWIDTH bytes each
byte vgaxfb[VGAX_HEIGHT*VGAX_BWIDTH];
//VSYNC interrupt: a new frame begins, so rewind the per-frame rendering state
ISR(TIMER1_OVF_vect) {
  //one more VSYNC seen
  ++vtimer;
  //rendering restarts from the first framebuffer row...
  rlinecnt=0;
  aline=(byte)-1;
  //...once the blank lines at the top of the frame have been skipped
  vskip=SKIPLINES;
}
//HSYNC interrupt
//Runs once per TIMER2 overflow and does, in order:
// 1) audio: counts afreq down and writes to PINC when it reaches zero
// 2) skips the line while vskip is non-zero
// 3) for the first 60 framebuffer rows: re-aligns to TCNT0 (dejitter) and
//    streams one framebuffer row (30 bytes, 4 pixels each) to PORTD
ISR(TIMER2_OVF_vect) {
/*
NOTE: I prefer to generate the line here, inside the interrupt.
Gammon's code generates the line pixels inside main().
My version generates the signal using only interrupts, so inside the main()
function you can do anything you want. Your code will be interrupted when the
VGA signal needs to be generated
*/
//generate audio modulation. around 15 clocks
//Z points to afreq; the branches are padded with nops so that every path
//takes a similar number of cycles before reaching "end"
//NOTE(review): cpi only accepts r16-r31 but [freq0] uses the generic "r"
//constraint - confirm the compiler always picks an upper register
//NOTE(review): afreq is written through Z but is not declared as an output
//and there is no "memory" clobber on this statement - confirm this is safe
asm volatile( //4c to load Z and Y
" ld r16, Z \n\t" //c1 r16=afreq
" cpi %[freq0], 0 \n\t" //c1 afreq0==0 ?
" breq no_audio \n\t" //c1/2 *0
"play_audio: \n\t"
" cpi r16, 0 \n\t" //c1 afreq==0 ?
" brne dont_flip_audio_pin \n\t" //c1/2 *1
"flip_audio_pin: \n\t"
" ldi r18, 1 \n\t" //c1
" out %[audiopin], r18 \n\t" //c1 write 1 to PINC (flips the audio pin, per the label)
" st Z, %[freq0] \n\t" //c1 afreq=afreq0
" rjmp end \n\t" //c2
//" mov r16, %[freq0]\n\r"
//" dec r16\n\r"
"no_audio: \n\t"
" nop \n\t" //c1
" nop \n\t" //c1
" nop \n\t" //c1
//" nop \n\t" //c1
" nop \n\t" //c1
" nop \n\t" //c1
" nop \n\t" //c1
" rjmp end \n\t" //c2
"dont_flip_audio_pin: \n\t"
" dec r16 \n\t" //c1
" st Z, r16 \n\t" //c1 afreq=afreq-1
//" nop \n\t" //c1
"end: \n\t"
:
: "z" (&afreq),
[freq0] "r" (afreq0),
[audiopin] "i" _SFR_IO_ADDR(PINC)
: "r16", "r18");
//check vertical porch: lines inside the skipped area produce no pixels
if (vskip) {
vskip--;
return;
}
//only the first 60 framebuffer rows are rendered
//NOTE(review): 60 is presumably VGAX_HEIGHT - confirm and use the macro
if (rlinecnt<60) {
//interrupt jitter fix (needed to keep signal stable)
//code from https://github.com/cnlohr/avrcraft/tree/master/terminal
//modified from 4 nop align to 8 nop align
//How it works: (TCNT0 - DEJITTER_SYNC) & 7 is added to the address of LW and
//the code jumps there, so a variable number of the nops below is executed.
//"call TL" is used only to obtain the current program counter: the return
//address it pushes is popped straight into r31:r30 (Z)
#define DEJITTER_OFFSET 1
#define DEJITTER_SYNC -3
asm volatile(
" lds r16, %[timer0] \n\t" //r16=TCNT0
//" add r16, %[toffset] \n\t" //
" subi r16, %[tsync] \n\t" //r16-=DEJITTER_SYNC
" andi r16, 7 \n\t" //keep the low 3 bits (0..7)
" call TL \n\t" //push the address of TL
"TL: \n\t" //
" pop r31 \n\t" //Z=address of TL
" pop r30 \n\t" //
" adiw r30, (LW-TL-5) \n\t" //Z=base of the jump target
" add r30, r16 \n\t" //skip r16 words (carry into r31 is ignored)
//" adc r31, __zero_reg__ \n\t" //
" ijmp \n\t" //jump to Z
"LW: \n\t" //
" nop \n\t" //
" nop \n\t" //
" nop \n\t" //
" nop \n\t" //
" nop \n\t" //
" nop \n\t" //
" nop \n\t" //
//" nop \n\t" //
"LBEND: \n\t" //
:
: [timer0] "i" (&TCNT0),
[toffset] "i" ((uint8_t)DEJITTER_OFFSET), //unused while the "add" above is commented out
[tsync] "i" ((uint8_t)DEJITTER_SYNC)
: "r30", "r31", "r16", "r17");
/*
Output all pixels.
NOTE: My trick here is to unpack 4 pixels and shift them before writing to
PORTD.
Pixels are packed as 0b11223344 because the first pixel write has no time
to perform a shift (ld, out) and must be prealigned to the two upper bits
of PORTD, where the two wires of the VGA DSUB are connected. The second,
the third and the fourth pixels are shifted left using the mul opcode instead
of a left shift opcode. Shift opcodes are slow and can shift only 1 bit at
a time, using 1 clock cycle. mul is faster.
Instead of using a loop I use the .rept assembler directive to generate an
unrolled loop of 30 iterations.
*/
//NOTE(review): mul writes its result to r1:r0; neither register is listed
//as clobbered and r1 (the avr-gcc zero register) is not cleared afterwards
//- confirm the C code that follows never relies on r1==0
//NOTE(review): the adjacent literals "z" "I" below concatenate into the
//single constraint string "zI" - confirm that plain "z" was intended
asm volatile (
".rept 126 \n\t" // right offset (invisible area)
" nop \n\t" //
".endr \n\t" //
" ldi r20, 4 \n\t" //const for <<2bit
".rept 30 \n\t" //output 4 pixels for each iteration
" ld r16, Z+ \n\t" //load the next framebuffer byte
" out %[port], r16 \n\t" //write pixel 1
" nop \n\t" //
" nop \n\t" //
" nop \n\t" //
" mul r16, r20 \n\t" //<<2
" out %[port], r0 \n\t" //write pixel 2
" nop \n\t" //
" nop \n\t" //
" nop \n\t" //
" mul r0, r20 \n\t" //<<4
" out %[port], r0 \n\t" //write pixel 3
" nop \n\t" //
" nop \n\t" //
" nop \n\t" //
" mul r0, r20 \n\t" //<<6
" out %[port], r0 \n\t" //write pixel 4
" nop \n\t" //
" nop \n\t" //
" nop \n\t" //
".endr \n\t" //
" nop \n\t" //expand last pixel
" ldi r16, 0 \n\t" //
" out %[port], r16 \n\t" //write black for next pixels
:
: [port] "I" (_SFR_IO_ADDR(PORTD)),
"z" "I" (/*rline*/(byte*)vgaxfb + rlinecnt*VGAX_BWIDTH)
: "r16", "r17", "r20", "r21", "memory"
);
//increment framebuffer line counter after 2 VGA lines
//NOTE(review): aline starts at -1 (255 as a byte), so ++aline reaches 2 on
//the third rendered line - confirm whether 2 or 3 lines per row is intended
if (++aline==2) {
aline=-1;
rlinecnt++;
}
}
}
/*
Start the VGA signal generation.
Reprograms TIMER0, TIMER1 and TIMER2, configures the sync and color pins as
outputs and enables the TIMER1/TIMER2 overflow interrupts. Interrupts are
disabled while the registers are being written and re-enabled at the end.
enableTone: when true, pin A0 is configured as output for the audio signal
*/
void VGAX::begin(bool enableTone) {
//Timers setup code, modified version of the Nick Gammon's VGA sketch
cli();
//setup audio pin
if (enableTone) {
pinMode(A0, OUTPUT);
}
//disable TIMER0 interrupt
//TIMER0 is left free-running: the HSYNC interrupt reads TCNT0 for its dejitter code
TIMSK0=0;
TCCR0A=0;
TCCR0B=1; //enable 16MHz counter (used to fix the HSYNC interrupt jitter)
OCR0A=0;
OCR0B=0;
TCNT0=0;
//TIMER1 - vertical sync pulses
pinMode(VSYNCPIN, OUTPUT);
TCCR1A=bit(WGM11) | bit(COM1A1);
TCCR1B=bit(WGM12) | bit(WGM13) | bit(CS12) | bit(CS10); //1024 prescaler
ICR1=259; //16666 / 64 uS=260 (less one)
OCR1A=0; //64 / 64 uS=1 (less one)
TIFR1=bit(TOV1); //clear overflow flag
TIMSK1=bit(TOIE1); //interrupt on overflow on TIMER1
//TIMER2 - horizontal sync pulses
pinMode(HSYNCPIN, OUTPUT);
TCCR2A=bit(WGM20) | bit(WGM21) | bit(COM2B1); //pin3=COM2B1
TCCR2B=bit(WGM22) | bit(CS21); //8 prescaler
OCR2A=127; //63.6 / 0.5 uS=128 (less one)
// OCR2A=63; //32 / 0.5 uS=64 (less one)
OCR2B=7; //4 / 0.5 uS=8 (less one)
TIFR2=bit(TOV2); //clear overflow flag
TIMSK2=bit(TOIE2); //interrupt on overflow on TIMER2
//pins for outputting the colour information
pinMode(COLORPIN0, OUTPUT);
pinMode(COLORPIN1, OUTPUT);
sei();
}
/*
Stop the VGA signal generation by clearing the control registers of the
three timers.
NOTE(review): the interrupt mask registers (TIMSK0/TIMSK1/TIMSK2) and the
original TIMER0 configuration changed by begin() are not restored here -
confirm that callers do not expect them back after end()
*/
void VGAX::end() {
//disable TIMER0
TCCR0A=0;
TCCR0B=0;
//disable TIMER1
TCCR1A=0;
TCCR1B=0;
//disable TIMER2
TCCR2A=0;
TCCR2B=0;
}
/*
Fill the whole framebuffer with a single color.
color: only the two low bits are used.
Each framebuffer byte packs 4 pixels of 2 bits each, so the color is
replicated into all four 2bit slots before the fill.
*/
void VGAX::clear(byte color) {
  //0x55 is 0b01010101: multiplying a 2bit value by it copies that value
  //into each of the four pixel slots of the byte
  const byte packed=(byte)((color & 3)*0x55);
  byte *dst=(byte*)vgaxfb;
  for (unsigned left=VGAX_BSIZE; left; left--)
    *dst++=packed;
}
/*
Copy a full-screen image into the framebuffer.
src: VGAX_BSIZE bytes, fetched one at a time with pgm_read_byte
*/
void VGAX::copy(byte *src) {
  byte *dst=(byte*)vgaxfb;
  for (unsigned i=0; i<VGAX_BSIZE; i++)
    dst[i]=pgm_read_byte(src + i);
}
/*
Fill a rectangle with a single color.
x, y: top-left corner, in pixels
width, height: size of the rectangle, in pixels
color: passed unchanged to putpixel
The rectangle is clipped to the framebuffer: parts that fall outside
VGAX_WIDTH x VGAX_HEIGHT are not drawn.
*/
void VGAX::fillrect(byte x, byte y, byte width, byte height, byte color) {
  //compute the end coordinates in a wider type: with byte arithmetic
  //x+width (or y+height) could wrap past 255 and draw on the opposite edge
  unsigned xend=(unsigned)x + width;
  unsigned yend=(unsigned)y + height;
  if (xend>VGAX_WIDTH)
    xend=VGAX_WIDTH;
  if (yend>VGAX_HEIGHT)
    yend=VGAX_HEIGHT;
  //when the origin is already off-screen the loops below do not run at all
  for (unsigned py=y; py<yend; py++) {
    for (unsigned px=x; px<xend; px++)
      putpixel((byte)px, (byte)py, color);
  }
}
void VGAX::tone(unsigned int frequency) {
//HSYNC=32usec
// afreq=1000000 / frequency / 2 / 32;
afreq=1000000 / frequency / 2 / 64;
afreq0=afreq;
}
//Stop the tone: with a zero reload value the HSYNC interrupt takes its
//no_audio path and stops writing to the audio pin
void VGAX::noTone() {
  afreq0 = 0;
}
/*
Busy-wait for approximately msec milliseconds.
msec: number of milliseconds to wait. Zero or negative values return
immediately.
The wait is a calibrated nop loop and gets longer whenever the VGA
interrupts preempt it.
*/
void VGAX::delay(int msec) {
  //"msec>0" (instead of "msec--") keeps a negative argument from counting
  //down through the whole int range
  for (; msec>0; msec--) {
    unsigned cnt=16000/32; //TODO: use a more precise way to calculate cnt
    while (cnt--)
      asm volatile("nop\nnop\nnop\nnop\n");
  }
}