xe #1
2 changed files with 29 additions and 48 deletions
76
imul8xe.s
76
imul8xe.s
|
@ -3,55 +3,38 @@ PORTB = $d301
|
||||||
|
|
||||||
|
|
||||||
EXTENDED_RAM = $4000 ; 16KiB bank on the XE
|
EXTENDED_RAM = $4000 ; 16KiB bank on the XE
|
||||||
bankswitch = ; ???
|
|
||||||
|
|
||||||
; input in X/Y (lo/hi)
|
; lookup table for top byte -> PORTB value for bank-switch
|
||||||
; output in FR0
|
.align 256
|
||||||
; clobbers FR0
|
bankswitch:
|
||||||
; 128 cycles
|
.repeat 256, i
|
||||||
proc imul8xe
|
.byte ((i & $c0) >> 5) | $c1
|
||||||
output = FR0
|
.endrepeat
|
||||||
ptr = FR0 + 2
|
|
||||||
|
|
||||||
lda #0 ; 2 cyc
|
; 58-77 cycles
|
||||||
sta ptr ; 3 cyc
|
.macro imul8xe dest, arg1, arg2
|
||||||
sta ptr + 1 ; 3 cyc
|
.local done
|
||||||
|
.local output
|
||||||
|
.local ptr
|
||||||
|
|
||||||
|
output = dest
|
||||||
|
ptr = dest + 2 ; scratch space assumed
|
||||||
|
|
||||||
; bottom 14 bits except the LSB are the per-bank table index
|
; bottom 14 bits except the LSB are the per-bank table index
|
||||||
; add $4000 for the bank pointer
|
; add $4000 for the bank pointer
|
||||||
txa ; 2 cyc
|
lda arg1 ; 3 cyc
|
||||||
and #$fe ; 2 cyc
|
and #$fe ; 2 cyc
|
||||||
sta ptr ; 3 cyc
|
sta ptr ; 3 cyc
|
||||||
tya ; 2 cyc
|
lda arg2 ; 3 cyc
|
||||||
and #$3f ; 2 cyc
|
and #$3f ; 2 cyc
|
||||||
clc ; 2 cyc
|
clc ; 2 cyc
|
||||||
adc #$40 ; 2 cyc
|
adc #$40 ; 2 cyc
|
||||||
sta ptr + 1 ; 3 cyc
|
sta ptr + 1 ; 3 cyc
|
||||||
|
|
||||||
; top 2 bits are the table bank selector
|
; top 2 bits are the table bank selector
|
||||||
tya ; 2 cyc
|
ldx arg2 ; 3 cyc
|
||||||
and #$c0 ; 2 cyc
|
lda bank_switch,x ; 4 cyc
|
||||||
; shift in extended RAM mode 2x 1 bits
|
sta PORTB ; 4 cyc
|
||||||
sec ; 2 cyc
|
|
||||||
ror ; 2 cyc
|
|
||||||
ror ; 2 cyc
|
|
||||||
; shift in 0 bits
|
|
||||||
asr ; 2 cyc
|
|
||||||
asr ; 2 cyc
|
|
||||||
asr ; 2 cyc
|
|
||||||
|
|
||||||
; save the second param for later
|
|
||||||
phy ; 3 cyc
|
|
||||||
|
|
||||||
; disable interrupts
|
|
||||||
lda NMIEN ; 4 cyc
|
|
||||||
pha ; 3 cyc
|
|
||||||
lda #0 ; 2 cyc
|
|
||||||
sta NMIEN ; 4 cyc
|
|
||||||
|
|
||||||
; set the standard top RAM and OS ROM on
|
|
||||||
or #$81 ; 2 cyc
|
|
||||||
sta PORTB ; 4 cyc
|
|
||||||
|
|
||||||
|
|
||||||
; copy the entry into output
|
; copy the entry into output
|
||||||
|
@ -62,22 +45,21 @@ proc imul8xe
|
||||||
lda (ptr),y ; 5 cyc
|
lda (ptr),y ; 5 cyc
|
||||||
sta output+1 ; 3 cyc
|
sta output+1 ; 3 cyc
|
||||||
|
|
||||||
; restore memory
|
; note: we are not restoring memory to save 6 cycles!
|
||||||
lda #$81 ; 2 cyc
|
; this means those 16kb have to be switched back to base RAM
|
||||||
sta PORTB ; 4 cyc
|
; if we need to use them anywhere else
|
||||||
|
;;; restore memory
|
||||||
; restore interrupts
|
;;lda #$81 ; 2 cyc - disabled
|
||||||
pla ; 3 cyc
|
;;sta PORTB ; 4 cyc - disabled
|
||||||
sta NMIEN ; 4 cyc
|
|
||||||
|
|
||||||
; check that 1 bit we skipped to fit into space
|
; check that 1 bit we skipped to fit into space
|
||||||
txa ; 2 cyc
|
lda arg1 ; 3 cyc
|
||||||
and $#1 ; 2 cyc
|
and $#1 ; 2 cyc
|
||||||
beq done ; 2 cyc
|
beq done ; 2 cyc
|
||||||
|
|
||||||
; add the second param one last time for the skipped bit
|
; add the second param one last time for the skipped bit
|
||||||
clc ; 2 cyc
|
clc ; 2 cyc
|
||||||
pla ; 3 cyc
|
lda arg2 ; 3 cyc
|
||||||
adc output ; 3 cyc
|
adc output ; 3 cyc
|
||||||
sta output ; 3 cyc
|
sta output ; 3 cyc
|
||||||
lda #0 ; 2 cyc
|
lda #0 ; 2 cyc
|
||||||
|
@ -85,9 +67,7 @@ proc imul8xe
|
||||||
sta output+1 ; 3 cyc
|
sta output+1 ; 3 cyc
|
||||||
|
|
||||||
done:
|
done:
|
||||||
pla
|
.endmacro
|
||||||
rts ; 6 cyc
|
|
||||||
endproc
|
|
||||||
|
|
||||||
proc imul8xe_init
|
proc imul8xe_init
|
||||||
rts
|
rts
|
||||||
|
|
1
mandel.s
1
mandel.s
|
@ -373,6 +373,7 @@ fill_masks:
|
||||||
.local next
|
.local next
|
||||||
.local small_product
|
.local small_product
|
||||||
; circa 92 cycles? this doesn't seem right
|
; circa 92 cycles? this doesn't seem right
|
||||||
|
; 81-92 cycles
|
||||||
.scope
|
.scope
|
||||||
mul_factor_a = arg1
|
mul_factor_a = arg1
|
||||||
mul_factor_x = arg2
|
mul_factor_x = arg2
|
||||||
|
|
Loading…
Reference in a new issue