forked from brooke/mandel-6502
Compare commits
90 commits
| Author | SHA1 | Date | |
|---|---|---|---|
| 6479cf530c | |||
| 29cd3d968f | |||
| b46e6fb343 | |||
| f2a6af0995 | |||
| 96e0356e57 | |||
| fab2760394 | |||
| fd954da47e | |||
| 4bac47a4fd | |||
| 5cf64970c8 | |||
|
|
f7082ab371 | ||
|
|
689363d083 | ||
| 89b4e45901 | |||
| 6e66145ec6 | |||
| 07db3d00d7 | |||
| 26d612b6f3 | |||
| 25da81c64b | |||
| d182d33b35 | |||
| e0cc704d99 | |||
| 7c04862d70 | |||
| 918d15e813 | |||
| eaa00a055a | |||
| 7e5ca79d9a | |||
| d2bf77dc26 | |||
| 582ddf497f | |||
| d157fe1306 | |||
| dcf5a3f59e | |||
| 837082cf56 | |||
| 65fcb44934 | |||
| c424f1b8bc | |||
| 49fe315529 | |||
| f1ebb21bcb | |||
| 87caa52543 | |||
| d8601bb856 | |||
| 7985ea9a39 | |||
| cc83c76706 | |||
| 2e8893fd78 | |||
| 81bf7f3c43 | |||
| 1e0f577e09 | |||
| d2f41f9644 | |||
| 2fcb30b76a | |||
| 13257309dc | |||
| 7184b8e03f | |||
| 4a1e35699a | |||
| 0d086a179c | |||
| 61eb1aaf21 | |||
| b56dc1e98b | |||
| 0a7293d8bc | |||
| ec42f672d4 | |||
| 67649d4743 | |||
| ed79c80b16 | |||
| e6cbe0bc6b | |||
| 6db8cef82d | |||
| 9b7f6b8937 | |||
| 3bd9b1ac31 | |||
| 63e74d5152 | |||
| 14125a398a | |||
| 71d8d93abc | |||
| 64a6cf50f3 | |||
| 100c0f3314 | |||
| e51aa91e4e | |||
| c4b98c7be2 | |||
| 70d2c91f03 | |||
| acac5a8df4 | |||
| 883f926e57 | |||
| 0c63430dd9 | |||
| 3ab5006aa3 | |||
| f903272335 | |||
| 8ad996981a | |||
| 15fc5367f9 | |||
| 2118890977 | |||
| 0fc5ba914f | |||
| 2b0167226e | |||
| 504457595a | |||
| 0fcf4d6676 | |||
| d83b811444 | |||
| f32cc5fa7c | |||
| 052a19b6aa | |||
| 83cba4afa3 | |||
| ee1c268705 | |||
| e84a990789 | |||
| 0cde31905e | |||
| 45c5a4cb2d | |||
| 34ce9da030 | |||
| a9d551a98d | |||
| 829d2860e8 | |||
| f996c3cbcd | |||
| 405cec6d51 | |||
| 05133aabdd | |||
| 7f2bc43cff | |||
| 5637783529 |
6 changed files with 1365 additions and 435 deletions
6
Makefile
6
Makefile
|
|
@ -2,8 +2,8 @@
|
||||||
|
|
||||||
all : mandel.xex
|
all : mandel.xex
|
||||||
|
|
||||||
mandel.xex : mandel.o tables.o
|
mandel.xex : mandel.o tables.o atari-asm-xex.cfg
|
||||||
ld65 -C ./atari-asm-xex.cfg -o $@ $+
|
ld65 -C ./atari-asm-xex.cfg --mapfile mandel.map -o $@ mandel.o tables.o
|
||||||
|
|
||||||
%.o : %.s
|
%.o : %.s
|
||||||
ca65 -o $@ $<
|
ca65 -o $@ $<
|
||||||
|
|
@ -15,4 +15,6 @@ clean :
|
||||||
rm -f tables.s
|
rm -f tables.s
|
||||||
rm -f *.o
|
rm -f *.o
|
||||||
rm -f *.xex
|
rm -f *.xex
|
||||||
|
rm -f mandel.map
|
||||||
|
|
||||||
|
|
||||||
|
|
|
||||||
28
atari-asm-xex.cfg
Normal file
28
atari-asm-xex.cfg
Normal file
|
|
@ -0,0 +1,28 @@
|
||||||
|
FEATURES {
|
||||||
|
STARTADDRESS: default = $2E00;
|
||||||
|
}
|
||||||
|
SYMBOLS {
|
||||||
|
__STARTADDRESS__: type = export, value = %S;
|
||||||
|
}
|
||||||
|
MEMORY {
|
||||||
|
ZP: file = "", define = yes, start = $0082, size = $007E;
|
||||||
|
MAIN: file = %O, define = yes, start = %S, size = $4000 - %S;
|
||||||
|
# Keep $4000-7fff clear for expanded RAM access window
|
||||||
|
TABLES: file = %O, define = yes, start = $8000, size = $a000 - $8000;
|
||||||
|
# Keep $a000-$bfff clear for BASIC cartridge
|
||||||
|
}
|
||||||
|
FILES {
|
||||||
|
%O: format = atari;
|
||||||
|
}
|
||||||
|
FORMATS {
|
||||||
|
atari: runad = start;
|
||||||
|
}
|
||||||
|
SEGMENTS {
|
||||||
|
ZEROPAGE: load = ZP, type = zp, optional = yes;
|
||||||
|
EXTZP: load = ZP, type = zp, optional = yes; # to enable modules to be able to link to C and assembler programs
|
||||||
|
CODE: load = MAIN, type = rw, define = yes;
|
||||||
|
RODATA: load = MAIN, type = ro optional = yes;
|
||||||
|
DATA: load = MAIN, type = rw optional = yes;
|
||||||
|
BSS: load = MAIN, type = bss, optional = yes, define = yes;
|
||||||
|
TABLES: load = TABLES, type = ro, optional = yes, align = 256;
|
||||||
|
}
|
||||||
25
readme.md
25
readme.md
|
|
@ -14,32 +14,37 @@ Non-goals:
|
||||||
|
|
||||||
Enjoy! I'll probably work on this off and on for the next few weeks until I've got it producing fractals.
|
Enjoy! I'll probably work on this off and on for the next few weeks until I've got it producing fractals.
|
||||||
|
|
||||||
-- brooke, january 2023 - february 2024
|
-- brooke, january 2023 - december 2024
|
||||||
|
|
||||||
## Current state
|
## Current state
|
||||||
|
|
||||||
Basic rendering is functional, but no interactive behavior (zoom/pan) or benchmarking is done yet.
|
Basic rendering is functional, with interactive zoom/pan (+/-/arrows) and 6 preset viewports via the number keys.
|
||||||
|
|
||||||
The 16-bit signed integer multiplication works; it takes two 16-bit inputs and emits one 32-bit output in the zero page, using the Atari OS ROM's floating point registers as workspaces. Inputs are clobbered.
|
The 16-bit signed integer multiplication takes two 16-bit inputs and emits one 32-bit output in the zero page, using the Atari OS ROM's floating point registers as workspaces. Inputs are clobbered.
|
||||||
|
|
||||||
The main loop is a basic add-and-shift, using 16-bit adds which requires flipping the sign of negative inputs (otherwise you'd have to add all those sign-extension bits). Runs in 470-780 cycles depending on input.
|
* 16-bit multiplies are decomposed into four 8-bit unsigned multiplies plus some additions
|
||||||
|
* an optimized case for squares uses a table of 8-bit squares to reduce the number of 8-bit multiplication sub-ops
|
||||||
|
* when expanded RAM is available, as on the 130XE, a 64KB 8-bit multiplication table accelerates the remaining multiplications
|
||||||
|
* without expanded RAM, a table of half-squares is used to implement the algorithm from https://everything2.com/title/Fast+6502+multiplication
|
||||||
|
|
||||||
The mandelbrot calculations are done using 4.12-precision fixed point numbers. It may be possible to squish this down to 3.13.
|
The mandelbrot calculations are done using 3.13-precision fixed point numbers with 6.26-precision intermediates.
|
||||||
|
|
||||||
Iterations are capped at 255.
|
Iterations are capped at 255.
|
||||||
|
|
||||||
The pixels are run in a progressive layout to get the basic shape on screen faster.
|
The pixels are run in a progressive layout to get the basic shape on screen faster.
|
||||||
|
|
||||||
## Next steps
|
There is a running counter of ms/px using the vertical blank interrupts as a timer, used to track our progress. :D
|
||||||
|
|
||||||
Add a running counter of ms/px using the vertical blank interrupts as a timer. This'll show how further work improves it!
|
There's a check for cycles in (zx,zy) output when in the 'lake'; if values repeat, they cannot escape. This is a big time saver in fractint.
|
||||||
|
|
||||||
Check for cycles in (zx,zy) output when in the 'lake'; if values repeat, they cannot escape. This is a big time saver in fractint.
|
There's some cute color cycling.
|
||||||
|
|
||||||
I may be able to do a faster multiply using tables of squares for 8-bit component multiplication.
|
|
||||||
|
|
||||||
## Deps and build instructions
|
## Deps and build instructions
|
||||||
|
|
||||||
I'm using `ca65` as a macro assembler, and have a Unix-style `Makefile` for building. Should work fairly easily on Linux and Mac. Might work on "raw" Windows but I use WSL for that.
|
I'm using `ca65` as a macro assembler, and have a Unix-style `Makefile` for building. Should work fairly easily on Linux and Mac. Might work on "raw" Windows but I use WSL for that.
|
||||||
|
|
||||||
Currently produces a `.xex` executable, which can be booted up in common Atari emulators and some i/o devices.
|
Currently produces a `.xex` executable, which can be booted up in common Atari emulators and some i/o devices.
|
||||||
|
|
||||||
|
## Todo
|
||||||
|
|
||||||
|
See ideas in `todo.md`.
|
||||||
|
|
|
||||||
23
tables.js
23
tables.js
|
|
@ -11,23 +11,40 @@ function db(func) {
|
||||||
return lines.join('\n');
|
return lines.join('\n');
|
||||||
}
|
}
|
||||||
|
|
||||||
|
let squares = [];
|
||||||
|
for (let i = 0; i < 512; i++) {
|
||||||
|
squares.push(Math.trunc((i * i + 1) / 2));
|
||||||
|
}
|
||||||
|
|
||||||
console.log(
|
console.log(
|
||||||
`.segment "TABLES"
|
`.segment "TABLES"
|
||||||
|
|
||||||
.export mul_lobyte256
|
.export mul_lobyte256
|
||||||
.export mul_hibyte256
|
.export mul_hibyte256
|
||||||
.export mul_hibyte512
|
.export mul_hibyte512
|
||||||
|
.export sqr_lobyte
|
||||||
|
.export sqr_hibyte
|
||||||
|
|
||||||
|
; (i * i + 1) / 2 for the multiplier
|
||||||
.align 256
|
.align 256
|
||||||
mul_lobyte256:
|
mul_lobyte256:
|
||||||
${db((x) => Math.round(x * x / 2) & 0xff)}
|
${db((i) => squares[i] & 0xff)}
|
||||||
|
|
||||||
.align 256
|
.align 256
|
||||||
mul_hibyte256:
|
mul_hibyte256:
|
||||||
${db((x) => (Math.round(x * x / 2) >> 8) & 0xff)}
|
${db((i) => (squares[i] >> 8) & 0xff)}
|
||||||
|
|
||||||
.align 256
|
.align 256
|
||||||
mul_hibyte512:
|
mul_hibyte512:
|
||||||
${db((x) => (Math.round((x + 256) * (x + 256) / 2) >> 8) & 0xff)}
|
${db((i) => (squares[i + 256] >> 8) & 0xff)}
|
||||||
|
|
||||||
|
; (i * i) for the plain squares
|
||||||
|
.align 256
|
||||||
|
sqr_lobyte:
|
||||||
|
${db((i) => (i * i) & 0xff)}
|
||||||
|
|
||||||
|
.align 256
|
||||||
|
sqr_hibyte:
|
||||||
|
${db((i) => ((i * i) >> 8) & 0xff)}
|
||||||
|
|
||||||
`);
|
`);
|
||||||
|
|
|
||||||
17
todo.md
Normal file
17
todo.md
Normal file
|
|
@ -0,0 +1,17 @@
|
||||||
|
things to try:
|
||||||
|
|
||||||
|
* fix status bar to show elapsed time, per-iter time, per-pixel iter count
|
||||||
|
|
||||||
|
* 'turbo' mode disabling graphics in full or part
|
||||||
|
|
||||||
|
* patch the entire expanded-ram imul8xe on top of imul8 to avoid the 3-cycle thunk penalty :D
|
||||||
|
|
||||||
|
* maybe clean up the load/layout of the big mul table
|
||||||
|
|
||||||
|
* consider alternate lookup tables in the top 16KB under ROM
|
||||||
|
|
||||||
|
* y-axis mirror optimization
|
||||||
|
|
||||||
|
* extract viewport for display & re-input via keyboard
|
||||||
|
|
||||||
|
* fujinet screenshot/viewport uploader
|
||||||
Loading…
Add table
Add a link
Reference in a new issue