1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
|
@ ScummVM Scumm Interpreter
@ Copyright (C) 2007 The ScummVM project
@
@ This program is free software@ you can redistribute it and/or
@ modify it under the terms of the GNU General Public License
@ as published by the Free Software Foundation@ either version 2
@ of the License, or (at your option) any later version.
@
@ This program is distributed in the hope that it will be useful,
@ but WITHOUT ANY WARRANTY; without even the implied warranty of
@ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
@ GNU General Public License for more details.
@
@ You should have received a copy of the GNU General Public License
@ along with this program@ if not, write to the Free Software
@ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
@
@ $URL: https://scummvm.svn.sourceforge.net/svnroot/scummvm/scummvm/trunk/engines/scumm/gfxARM.s $
@ $Id: gfxARM.s 29646 2007-11-26 16:54:56Z fingolfin $
@
@ @author Robin Watts (robin@wss.co.uk)
.text
.global ClassicProc3RendererShadowARM
.equ _scaleIndexY , 112
.equ _numStrips , 108
.equ _palette , 104
.equ _shadow_table , 100
.equ _scaleIndexX , 96
.equ _scaleX , 92
.equ _height , 88
.equ store_r14 , 84
.equ store_r11 , 80
.equ store_r10 , 76
.equ store_r9 , 72
.equ store_r8 , 68
.equ store_r7 , 64
.equ store_r6 , 60
.equ store_r5 , 56
.equ store_r4 , 52
.equ src , 48
.equ height , 44
.equ len , 40
.equ v1_shr , 36
.equ v1_skip_width , 32
.equ v1_destptr , 28
.equ v1_scaleXstep , 24
.equ v1_mask_ptr , 20
.equ v1_y , 16
.equ v1_scaletable , 12
.equ pitch , 8
.equ scaleIdxXPtr , 4
.equ scaleIdxYPtr , 0
.equ space , 48
@ r0 = _scaleY
@ r1 = v1
@ r2 = _out
@ r3 = src
@ <> = _height
@ <> = _scaleX
@ <> = _scaleIndexX
@ <> = _shadow_table
@ <> = _palette
@ <> = _numstrips
@ <> = _scaleIndexY
ClassicProc3RendererShadowARM:
@ shadow20 = false
@ shadowed = true
@ unscaled = false
STMFD r13!,{r3-r11,r14}
LDRH r6,[r2,#2]
LDRH r7,[r2] @ r7 = _out.w
LDRH r8,[r2,#4] @ r8 = _out.pitch
ADD r6,r6,#1 @ r6 = _out.h+1
SUB r13,r13,#space
STR r3,[r13,#src]
STR r8,[r13,#pitch]
LDMIA r1,{r3,r4,r5,r8,r9,r10,r11}
@ r3 = v1.x
@ r4 = v1.y
@ r5 = scaletable
@ r8 = skip_width
@ r9 = destptr
@ r10= mask_ptr
@ r11= scaleXstep
LDR r2, [r13,#_scaleIndexY]
LDR r12,[r13,#_scaleIndexX]
STR r4, [r13,#v1_y]
STR r5, [r13,#v1_scaletable]
ADD r2, r5,r2 @ r2 = &scaletable[_scaleIndexY]
ADD r5, r5,r12 @ r5 = &scaletable[_scaleIndexX]
STR r5, [r13,#scaleIdxXPtr]
STR r2, [r13,#scaleIdxYPtr]
STR r8, [r13,#v1_skip_width]
LDRB r8, [r1,#29] @ r8 = shr
LDRB r14,[r1,#31] @ r14= replen
LDRB r1, [r1,#30] @ r1 = repcolor
STR r8, [r13,#v1_shr]
STR r9, [r13,#v1_destptr]
STR r10,[r13,#v1_mask_ptr]
STR r11,[r13,#v1_scaleXstep]
LDR r12,[r13,#_height]
@ r0 = _scaleY
@ r1 = v1.repcolor
@ r2 = &v1.scaletable[scaleIndexY]
@ r3 = v1.x
@ r4 = v1.y
@ r5 =
@ r6 = _out.h+1
@ r7 = _out.w
@ r8 =
@ r9 = v1.destptr
@ r10= v1.mask_ptr
@ r11=
@ r12= _height
@ r14= v1.replen
MOV r8,#0x80
AND r11,r3,#7 @ r11= v1.x & 7
MOV r8,r8,LSR r11 @ r8 = maskbit = revBitMask(v1.x & 7)
ADD r10,r10,r3,ASR #3 @ r10= mask = v1.mask_ptr + (v1.x>>3)
@ r0 = _scaleY
@ r1 = color = v1.repcolor
@ r2 = &v1.scaletable[scaleIndexY]
@ r3 = v1.x
@ r4 = y = v1.y
@ r5 =
@ r6 = _out.h+1
@ r7 = _out.w
@ r8 = maskbit
@ r9 = v1.destptr
@ r10= mask
@ r11=
@ r12= height = _height
@ r14= len = v1.replen
CMP r14,#0
BEQ outerloop
ADD r12,r12,#1 @ r12= height++
MOV r5,r12 @ r5 = loopCount = height
CMP r5,r14 @ if (loopCount > len)
MOVGT r5,r14 @ loopCount = len
SUB r12,r12,r5
SUB r14,r14,r5
STR r12,[r13,#height]
STR r14,[r13,#len]
LDR r12,[r13,#pitch]
B startpos
outerloop:
@ r0 = _scaleY
@ r1 = color
@ r2 = &v1.scaletable[scaleIndexY]
@ r3 = x
@ r4 = y
@ r5 =
@ r6 = _out.h+1
@ r7 = _out.w
@ r8 = maskbit
@ r9 = dst
@ r10= mask
@ r11=
@ r12= height
@ r14=
LDR r11,[r13,#src]
LDR r5,[r13,#v1_shr]
@ stall
LDRB r14,[r11],#1 @ r14= len = *src++
@ stall
@ stall
MOV r1, r14,LSR r5 @ r1 = color = len>>v1.shr
BICS r14,r14,r1,LSL r5 @ r14= len
LDREQB r14,[r11],#1 @ if (!len) r14 = len = *src++
STR r11,[r13,#src]
middleloop:
@ r0 = _scaleY
@ r1 = color
@ r2 = &v1.scaletable[scaleIndexY]
@ r3 = x
@ r4 = y
@ r5 = loopCount = min(height,len)
@ r6 = _out.h+1
@ r7 = _out.w
@ r8 = maskbit
@ r9 = dst
@ r10= mask
@ r11=
@ r12= height
@ r14= len
MOV r5,r12 @ loopCount = height
CMP r5,r14 @ if (loopCount > len)
MOVGT r5,r14 @ loopCount = len
SUB r12,r12,r5 @ height -= loopCount
SUB r14,r14,r5 @ len -= loopCount
STR r12,[r13,#height]
STR r14,[r13,#len]
LDR r11,[r13,#_numStrips]
LDR r12,[r13,#pitch]
@ r0 = _scaleY
@ r1 = color
@ r2 = &v1.scaletable[scaleIndexY]
@ r3 = x
@ r4 = y
@ r5 = loopCount = min(height,len)
@ r6 = _out.h+1
@ r7 = _out.w
@ r8 = maskbit
@ r9 = dst
@ r10= mask
@ r11= _numStrips
@ r12= _out.pitch
@ r14= scratch
innerloop:
@ inner loop
CMP r0,#254 @ if _scaleY <= 254
LDRLEB r14,[r2],#1 @ r14 = v1.scaletable[scaleIndexY++]
@ stallLE
@ stallLE
CMPLE r0,r14 @ || _scaleY >= r14
BLE startpos
LDRB r14,[r10],r11 @ r14 = mask[0] mask += _numStrips
ADDS r4,r4,#1 @ y >= 0 (equiv to y>-1,y+1>0)
CMPGT r1,#0 @ && color > 0
CMPGT r6,r4 @ && _out.h+1 > y+1
CMNGT r3,#1 @ && x >= 0 (equiv to x>-1,x+1>0)
CMPGT r7,r3 @ && _out.w > x
BLE masked
TST r14,r8 @ && !(mask[0] && maskbit)
LDREQ r14,[r13,#_palette]
BNE masked
@ stall
LDRB r14,[r14,r1] @ r14 = pcolor = _palette[color]
@ stall
@ stall
CMP r14,#13 @ if (pcolor == 13)
LDREQ r12,[r13,#_shadow_table]
LDREQB r14,[r9] @ r14 = *dst
@ stallEQ
@ stallEQ
LDREQB r14,[r12,r14] @ r14 = pcolor=_shadow_tab[r14]
LDREQ r12,[r13,#pitch]
@ stallEQ
STRB r14,[r9] @ *dst = pcolor
masked:
ADD r9,r9,r12 @ dst += _out.pitch
startpos:
SUBS r5,r5,#1 @ loopCount -=1
BNE innerloop
@ So we either ran out of height or len (or both)
LDR r12,[r13,#height]
LDR r14,[r13,#len]
CMP r12,#0
BNE notheight
LDR r10,[r13,#v1_skip_width]
LDR r11,[r13,#_scaleX]
LDR r2,[r13,#scaleIdxXPtr]
LDR r12,[r13,#v1_scaleXstep]
SUBS r10,r10,#1 @ if --v1.skip_width == 0
BEQ end @ return _scaleIndexX
LDRB r9,[r2],r12 @ r2 = scaleIdxXPtr+=sclXstp
STR r10,[r13,#v1_skip_width]
CMP r11,#254 @ if _scaleX <= 254
CMPLE r11,r9 @ && _scaleX <= scltb[scIdxX]
LDR r9,[r13,#v1_destptr] @ r9 = dst = v1.destptr
BLE noXstep
SUB r11,r7,#1
ADDS r3,r3,r12 @ v1.x += v1.scaleXstep
@ if v1.x < 0 ||
CMPGE r11,r3 @ _out.w-1 < v1.x
BLT end
AND r11,r3,#7
MOV r8,#0x80
MOV r8,r8,LSR r11 @ maskbit = revBitMask(v1.x & 7)
ADD r9,r9,r12 @ r10 = v1.destptr += v1.scaleXstep
STR r9,[r13,#v1_destptr]
noXstep:
STR r2,[r13,#scaleIdxXPtr]
LDR r10,[r13,#v1_mask_ptr]
LDR r12,[r13,#_height] @ r12= height = _height
LDR r4,[r13,#v1_y] @ r4 = y = v1.y
LDR r2,[r13,#scaleIdxYPtr] @ r2 = v1.scaletable[sclIdxY]
ADD r10,r10,r3,ASR #3 @ mask=v1.mask_ptr+(v1.x>>3)
notheight:
CMP r14,#0 @ while (len > 0)
BGT middleloop
B outerloop @ while (1)
end:
LDR r0,[r13,#v1_scaletable]
SUB r0,r2,r0
ADD r13,r13,#space
LDMFD r13!,{r3-r11,PC}
|