summaryrefslogtreecommitdiff
path: root/apps/codecs/libmad/dct32_arm.S
blob: a4eda8a0878900512cfde20ae3e103f4b8621894 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
/***************************************************************************
 *             __________               __   ___.
 *   Open      \______   \ ____   ____ |  | _\_ |__   _______  ___
 *   Source     |       _//  _ \_/ ___\|  |/ /| __ \ /  _ \  \/  /
 *   Jukebox    |    |   (  <_> )  \___|    < | \_\ (  <_> > <  <
 *   Firmware   |____|_  /\____/ \___  >__|_ \|___  /\____/__/\_ \
 *                     \/            \/     \/    \/            \/
 * $Id$
 *
 * Copyright (C) 2007 by Tomasz Malesinski
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 *
 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
 * KIND, either express or implied.
 *
 ****************************************************************************/

#include "mad_iram.h"

    .global dct32

    .section    ICODE_SECTION_MPA_ARM,"ax",%progbits

dct32:
    stmdb    sp!, {r4-r11, lr}
    sub      sp, sp, #144
    str      r0, [sp, #12]
    str      r1, [sp, #8]
    str      r2, [sp, #4]
    str      r3, [sp]
    add      r0, sp, #16
    add      r1, r0, #128
    ldr      r2, =bitrev
.shuffle:
    ldr      r5, [sp, #12]
    ldr      r3, [r2], #4
    sub      r4, r5, r3, lsl #4
    add      r3, r5, r3, lsl #4
    ldr      r6, [r3]
    ldr      r8, [r4, #124]
    add      r6, r6, r8
    sub      r8, r6, r8, lsl #1
    ldr      r7, [r3, #8]
    ldr      lr, [r4, #116]
    add      r7, r7, lr
    sub      lr, r7, lr, lsl #1
    ldr      r10, [r3, #64]
    ldr      r9, [r4, #60]
    add      r10, r10, r9
    sub      r9, r10, r9, lsl #1
    ldr      r11, [r3, #72]
    ldr      r12, [r4, #52]
    add      r11, r11, r12
    sub      r12, r11, r12, lsl #1
    add      r6, r6, r10
    sub      r10, r6, r10, lsl #1
    add      r7, r7, r11
    sub      r11, r7, r11, lsl #1
    add      r8, r8, r12
    sub      r12, r8, r12, lsl #1
    add      lr, lr, r9
    sub      r9, lr, r9, lsl #1
    stmia    r0!, {r6, r7, r8, r9, r10, r11, r12, lr}
    cmp      r0, r1
    bne      .shuffle
    ldr      r0, =189812531
    add      r1, sp, #16
    add      r3, r1, #128
.l2:
    add      r2, r1, #32
    ldmia    r2, {r4, r5, r8, r9}
    ldmia    r1, {r6, r7, r10, r11}
    add      r6, r6, r4
    sub      r4, r6, r4, lsl #1
    add      r7, r7, r5
    sub      r5, r7, r5, lsl #1
    stmia    r2!, {r4, r5}
    stmia    r1!, {r6, r7}
    add      r9, r9, r8
    sub      r8, r9, r8, lsl #1
    smull    r4, r6, r9, r0
    movs     r4, r4, lsr #28
    adc      r4, r4, r6, lsl #4
    smull    r5, r6, r8, r0
    movs     r5, r5, lsr #28
    adc      r5, r5, r6, lsl #4
    add      r10, r10, r4
    sub      r4, r10, r4, lsl #1
    add      r11, r11, r5
    sub      r5, r11, r5, lsl #1
    stmia    r2!, {r4, r5}
    stmia    r1!, {r10, r11}
    ldmia    r2, {r5, r6, r8, r11}
    ldmia    r1, {r4, r7, r9, r10}
    add      r4, r4, r6
    sub      r6, r4, r6, lsl #1
    add      r7, r7, r5
    sub      r5, r7, r5, lsl #1
    stmia    r2!, {r6, r7}
    stmia    r1!, {r4, r5}
    add      r11, r11, r8
    sub      r8, r11, r8, lsl #1
    smull    r5, r4, r8, r0
    movs     r5, r5, lsr #28
    adc      r5, r5, r4, lsl #4
    smull    r6, r4, r11, r0
    movs     r6, r6, lsr #28
    adc      r6, r6, r4, lsl #4
    add      r9, r9, r5
    sub      r5, r9, r5, lsl #1
    sub      r10, r10, r6
    add      r6, r10, r6, lsl #1
    stmia    r2!, {r5, r6}
    stmia    r1!, {r9, r10}
    add      r1, r1, #32
    cmp      r1, r3
    bne      .l2
    add      r2, sp, #16
    add      r3, r2, #64
    ldr      r0, =sincos
    add      r1, r0, #128
.lbut8:
    ldmia    r3, {r7, r8}
    ldmia    r0, {r9, r10}
    add      r0, r0, #16
    smull    r6, r5, r7, r9
    smlal    r6, r5, r10, r8
    movs     r6, r6, lsr #28
    adc      r6, r6, r5, lsl #4
    smull    r10, r5, r7, r10
    rsb      r9, r9, #0
    smlal    r10, r5, r8, r9
    movs     r10, r10, lsr #28
    adc      r5, r10, r5, lsl #4
    ldmia    r2, {r7, r8}
    add      r7, r7, r5
    sub      r5, r7, r5, lsl #1
    add      r8, r8, r6
    sub      r6, r8, r6, lsl #1
    stmia    r3!, {r5, r6}
    stmia    r2!, {r7, r8}
    cmp      r0, r1
    bne      .lbut8
    add      r1, sp, #16
    ldr      r2, =sincos
    ldr      r3, =sincos2
    ldr      r0, [sp, #8]
    mov      r0, r0, lsl #2
    ldr      r4, [sp, #4]
    add      r4, r4, r0
    ldr      r5, [sp]
    add      r5, r5, #480
    add      r5, r5, r0
    mov      r0, #0
.l4:
    rsb      r12, r0, #16
    and      r12, r12, #15
    add      lr, sp, #16
    add      r12, lr, r12, lsl #3
    ldmia    r1!, {r10, r11}
    ldmia    r12, {r6, r7}
    add      r6, r6, r10
    sub      r10, r6, r10, lsl #1
    add      r11, r11, r7
    sub      r7, r11, r7, lsl #1
    ldmia    r2!, {r12, lr}
    smull    r9, r8, r11, r12
    smlal    r9, r8, lr, r10
    movs     r9, r9, lsr #28
    adc      r9, r9, r8, lsl #4
    smull    lr, r8, r11, lr
    rsb      r12, r12, #0
    smlal    lr, r8, r10, r12
    movs     lr, lr, lsr #28
    adc      r8, lr, r8, lsl #4
    add      r6, r6, r8
    sub      r8, r6, r8, lsl #1
    add      r7, r7, r9
    sub      r9, r7, r9, lsl #1
    add      lr, r3, #128
    ldmia    lr, {r10, r11}
    smull    lr, r12, r8, r11
    smlal    lr, r12, r9, r10
    movs     lr, lr, lsr #28
    adc      r12, lr, r12, lsl #4
    str      r12, [r4], #32
    cmp      r0, #0
    cmpne    r0, #8
    beq      .skip1
    smull    lr, r12, r8, r10
    rsb      r9, r9, #0
    smlal    lr, r12, r9, r11
    movs     lr, lr, lsr #28
    adc      r12, lr, r12, lsl #4
    add      lr, r5, r0, lsl #6
    str      r12, [lr, #-512]
.skip1:
    ldmia    r3!, {r10, r11}
    smull    lr, r12, r7, r10
    smlal    lr, r12, r6, r11
    movs     lr, lr, lsr #28
    adc      r12, lr, r12, lsl #4
    str      r12, [r5], #-32
    cmp      r0, #0
    cmpne    r0, #8
    beq      .skip2
    smull    lr, r12, r6, r10
    rsb      r7, r7, #0
    smlal    lr, r12, r7, r11
    movs     lr, lr, lsr #28
    adc      r12, lr, r12, lsl #4
    sub      lr, r4, r0, lsl #6
    str      r12, [lr, #480]
.skip2:
    add      r0, r0, #1
    cmp      r0, #9
    bne      .l4
    add      sp, sp, #144
    ldmia    sp!, {r4-r11, pc}
bitrev:
    .word 0x0
    .word 0x2
    .word 0x1
    .word 0x3

sincos:
    .word 0x0
    .word 0x10000000
    .word -0x31f1708
    .word 0xfb14be8
    .word -0x61f78aa
    .word 0xec835e8
    .word -0x8e39d9d
    .word 0xd4db315
    .word -0xb504f33
    .word 0xb504f33
    .word -0xd4db315
    .word 0x8e39d9d
    .word -0xec835e8
    .word 0x61f78aa
    .word -0xfb14be8
    .word 0x31f1708
    .word -0x10000000
    .word 0x0
    .word -0xfb14be8
    .word -0x31f1708
    .word -0xec835e8
    .word -0x61f78aa
    .word -0xd4db315
    .word -0x8e39d9d
    .word -0xb504f33
    .word -0xb504f33
    .word -0x8e39d9d
    .word -0xd4db315
    .word -0x61f78aa
    .word -0xec835e8
    .word -0x31f1708
    .word -0xfb14be8

sincos2:
    .word 0x0
    .word 0x8000000
    .word 0x647d98
    .word 0x7fd8879
    .word 0xc8bd36
    .word 0x7f62369
    .word 0x12c8107
    .word 0x7e9d560
    .word 0x18f8b84
    .word 0x7d8a5f4
    .word 0x1f19f98
    .word 0x7c29fbf
    .word 0x25280c6
    .word 0x7a7d056
    .word 0x2b1f34f
    .word 0x7884841
    .word 0x30fbc55
    .word 0x7641af4
    .word 0x36ba201
    .word 0x73b5ebd
    .word 0x3c56ba7
    .word 0x70e2cbc
    .word 0x41ce1e6
    .word 0x6dca0d1
    .word 0x471cece
    .word 0x6a6d98a
    .word 0x4c3fdff
    .word 0x66cf812
    .word 0x5133cc9
    .word 0x62f201b
    .word 0x55f5a4d
    .word 0x5ed77c9
    .word 0x5a8279a
    .word 0x5a8279a
    .word 0x5ed77c9
    .word 0x55f5a4d
    .word 0x62f201b
    .word 0x5133cc9
    .word 0x66cf812
    .word 0x4c3fdff
    .word 0x6a6d98a
    .word 0x471cece
    .word 0x6dca0d1
    .word 0x41ce1e6
    .word 0x70e2cbc
    .word 0x3c56ba7
    .word 0x73b5ebd
    .word 0x36ba201
    .word 0x7641af4
    .word 0x30fbc55
    .word 0x7884841
    .word 0x2b1f34f
    .word 0x7a7d056
    .word 0x25280c6
    .word 0x7c29fbf
    .word 0x1f19f98
    .word 0x7d8a5f4
    .word 0x18f8b84
    .word 0x7e9d560
    .word 0x12c8107
    .word 0x7f62369
    .word 0xc8bd36
    .word 0x7fd8879
    .word 0x647d98