2 * (C) Gražvydas "notaz" Ignotas, 2011
4 * This work is licensed under the terms of any of these licenses
6 * - GNU GPL, version 2 or later.
7 * - GNU LGPL, version 2.1 or later.
8 * See the COPYING file in the top-level directory.
11 #include "arm_features.h"
16 .macro load_varadr reg var
17 #if defined(__ARM_ARCH_7A__) && !defined(__PIC__)
18 movw \reg, #:lower16:EVAR(\var)
19 movt \reg, #:upper16:EVAR(\var)
27 FUNCTION(mix_chan): @ (int start, int count, int lv, int rv)
29 vmov.32 d14[1], r3 @ multipliers
31 load_varadr r0, ChanBuf
32 load_varadr r2, SSumLR
38 vmul.s32 d10, d14, d0[0]
39 vmul.s32 d11, d14, d0[1]
40 vmul.s32 d12, d14, d1[0]
41 vmul.s32 d13, d14, d1[1]
60 FUNCTION(mix_chan_rvb): @ (int start, int count, int lv, int rv)
62 vmov.32 d14[1], r3 @ multipliers
64 load_varadr r0, ChanBuf
65 load_varadr r3, sRVBStart
66 load_varadr r2, SSumLR
75 vmul.s32 d10, d14, d0[0]
76 vmul.s32 d11, d14, d0[1]
77 vmul.s32 d12, d14, d1[0]
78 vmul.s32 d13, d14, d1[1]
102 #elif defined(HAVE_ARMV5)
104 FUNCTION(mix_chan): @ (int start, int count, int lv, int rv)
105 stmfd sp!, {r4-r8,lr}
106 orr r3, r2, r3, lsl #16
107 lsl r3, #1 @ packed multipliers << 1
109 load_varadr r0, ChanBuf
110 load_varadr r2, SSumLR
116 lsl r4, #1 @ adjust for mul
118 smlawb r6, r4, r3, r6
119 smlawt r7, r4, r3, r7
120 smlawb r8, r5, r3, r8
121 smlawt lr, r5, r3, lr
124 stmia r2!, {r6-r8,lr}
126 ldmeqfd sp!, {r4-r8,pc}
130 ldmfd sp!, {r4-r8,pc}
133 FUNCTION(mix_chan_rvb): @ (int start, int count, int lv, int rv)
134 stmfd sp!, {r4-r8,lr}
135 orr lr, r2, r3, lsl #16
137 load_varadr r3, sRVBStart
138 load_varadr r2, SSumLR
139 load_varadr r4, ChanBuf
141 add r2, r2, r0, lsl #3
142 add r3, r3, r0, lsl #3
143 add r0, r4, r0, lsl #2
149 smlawb r6, r4, lr, r6 @ supposedly takes single cycle?
150 smlawt r7, r4, lr, r7
151 smlawb r8, r4, lr, r8
152 smlawt r12,r4, lr, r12
157 ldmfd sp!, {r4-r8,pc}
161 @ vim:filetype=armasm