diff options
author | David Guillen Fandos | 2021-03-15 02:25:02 +0100 |
---|---|---|
committer | David Guillen Fandos | 2021-03-15 02:25:02 +0100 |
commit | c86b9064df021a8d619fd0e9fd4d3525cd4a1373 (patch) | |
tree | 7b5b7517b8d36ba0894ee710105e4da3b3017636 /psp | |
parent | 6e9104e1ee0881a9e51e95b8b1d52eb0b612adf4 (diff) | |
download | picogpsp-c86b9064df021a8d619fd0e9fd4d3525cd4a1373.tar.gz picogpsp-c86b9064df021a8d619fd0e9fd4d3525cd4a1373.tar.bz2 picogpsp-c86b9064df021a8d619fd0e9fd4d3525cd4a1373.zip |
Move palettes around to simplify MIPS dynarec
Will move also OAM structures to gain a few cycles per load/store.
Loads can also be optimized for an extra instruction per access.
Diffstat (limited to 'psp')
-rw-r--r-- | psp/mips_stub.S | 60 |
1 files changed, 28 insertions, 32 deletions
diff --git a/psp/mips_stub.S b/psp/mips_stub.S index 2e83064..ed0e370 100644 --- a/psp/mips_stub.S +++ b/psp/mips_stub.S @@ -46,6 +46,8 @@ .global execute_arm_translate .global icache_region_sync .global reg_check +.global palette_ram +.global palette_ram_converted .global memory_map_read .global memory_map_write @@ -2093,18 +2095,15 @@ execute_store_io_u8: execute_store_palette_u8: region_check 5, patch_store_u8 - lui $2, %hi(palette_ram) # start loading palette_ram address (delay) + andi $2, $4, 0x3FE # align palette address ins $5, $5, 8, 8 # double value - andi $4, $4, 0x3FE # align palette address - addu $2, $2, $4 - sh $5, %lo(palette_ram)($2) # palette_ram[address] = value + addu $2, $2, $16 + sh $5, 0x100($2) # palette_ram[address] = value sll $1, $5, 1 # make green 6bits ins $1, $0, 0, 6 # make bottom bit 0 ins $1, $5, 0, 5 # insert red channel into $1 - lui $2, %hi(palette_ram_converted) - addu $2, $2, $4 jr $ra # return - sh $1, %lo(palette_ram_converted)($2) + sh $1, 0x500($2) execute_store_vram_u8: translate_region_vram_store_align16 patch_store_u8 @@ -2193,17 +2192,14 @@ execute_store_io_u16: execute_store_palette_u16: region_check 5, patch_store_u16 - lui $2, %hi(palette_ram) # start loading palette_ram address (delay) - andi $4, $4, 0x3FE # wrap/align palette address - addu $2, $2, $4 - sh $5, %lo(palette_ram)($2) # palette_ram[address] = value + andi $2, $4, 0x3FE # wrap/align palette address + addu $2, $2, $16 + sh $5, 0x100($2) # palette_ram[address] = value sll $1, $5, 1 # make green 6bits ins $1, $0, 0, 6 # make bottom bit 0 ins $1, $5, 0, 5 # insert red channel into $1 - lui $2, %hi(palette_ram_converted) - addu $2, $2, $4 jr $ra # return - sh $1, %lo(palette_ram_converted)($2) + sh $1, 0x500($2) execute_store_vram_u16: translate_region_vram_store_align16 patch_store_u16 @@ -2295,18 +2291,14 @@ execute_store_io_u32: execute_store_palette_u32: region_check 5, patch_store_u32 - lui $2, %hi(palette_ram) # start loading palette_ram address (delay) - andi $4, $4, 0x3FC # wrap/align palette address - addu $2, $2, $4 - sw $5, %lo(palette_ram)($2) # palette_ram[address] = value + andi $2, $4, 0x3FC # wrap/align palette address + addu $2, $2, $16 + sw $5, 0x100($2) # palette_ram[address] = value sll $1, $5, 1 # make green 6bits ins $1, $0, 0, 6 # make bottom bit 0 ins $1, $5, 0, 5 # insert red channel into $1 - lui $2, %hi(palette_ram_converted) - addu $2, $2, $4 - addiu $2, $2, %lo(palette_ram_converted) - sh $1, ($2) + sh $1, 0x500($2) srl $5, $5, 16 # shift down to next palette value sll $1, $5, 1 # make green 6bits @@ -2314,7 +2306,7 @@ execute_store_palette_u32: ins $1, $5, 0, 5 # insert red channel into $1 jr $ra # return - sh $1, 2($2) + sh $1, 0x502($2) execute_store_vram_u32: translate_region_vram_store_align32 patch_store_u32 @@ -2411,18 +2403,14 @@ execute_store_io_u32a: execute_store_palette_u32a: region_check 5, patch_store_u32a - lui $2, %hi(palette_ram) # start loading palette_ram address (delay) - andi $4, $4, 0x3FC # wrap/align palette address - addu $2, $2, $4 - sw $5, %lo(palette_ram)($2) # palette_ram[address] = value + andi $2, $4, 0x3FC # wrap/align palette address + addu $2, $2, $16 + sw $5, 0x100($2) # palette_ram[address] = value sll $1, $5, 1 # make green 6bits ins $1, $0, 0, 6 # make bottom bit 0 ins $1, $5, 0, 5 # insert red channel into $1 - lui $2, %hi(palette_ram_converted) - addu $2, $2, $4 - addiu $2, $2, %lo(palette_ram_converted) - sh $1, ($2) + sh $1, 0x500($2) srl $5, $5, 16 # shift down to next palette value sll $1, $5, 1 # make green 6bits @@ -2430,7 +2418,7 @@ execute_store_palette_u32a: ins $1, $5, 0, 5 # insert red channel into $1 jr $ra # return - sh $1, 2($2) + sh $1, 0x502($2) execute_store_vram_u32a: translate_region_vram_store_align32 patch_store_u32a @@ -2810,6 +2798,7 @@ execute_arm_translate: .data +.align 6 memory_map_read: .space 0x8000 @@ -2819,5 +2808,12 @@ memory_map_read: reg: .space 0x100 +# Placed here for easy access +palette_ram: + .space 0x400 +palette_ram_converted: + .space 0x400 + + memory_map_write: .space 0x8000 |