diff options
Diffstat (limited to 'apps')
-rw-r--r-- | apps/dsp_cf.S | 214 |
1 files changed, 107 insertions, 107 deletions
diff --git a/apps/dsp_cf.S b/apps/dsp_cf.S index 233be82860..d832b9f0e8 100644 --- a/apps/dsp_cf.S +++ b/apps/dsp_cf.S | |||
@@ -20,8 +20,8 @@ | |||
20 | /**************************************************************************** | 20 | /**************************************************************************** |
21 | * apply_crossfeed(int32_t* src[], int count) | 21 | * apply_crossfeed(int32_t* src[], int count) |
22 | */ | 22 | */ |
23 | .section .text | 23 | .section .text |
24 | .global apply_crossfeed | 24 | .global apply_crossfeed |
25 | apply_crossfeed: | 25 | apply_crossfeed: |
26 | lea.l (-44, %sp), %sp | 26 | lea.l (-44, %sp), %sp |
27 | movem.l %d2-%d7/%a2-%a6, (%sp) | save all regs | 27 | movem.l %d2-%d7/%a2-%a6, (%sp) | save all regs |
@@ -85,137 +85,137 @@ apply_crossfeed: | |||
85 | lea.l (44, %sp), %sp | 85 | lea.l (44, %sp), %sp |
86 | rts | 86 | rts |
87 | .cfend: | 87 | .cfend: |
88 | .size apply_crossfeed,.cfend-apply_crossfeed | 88 | .size apply_crossfeed,.cfend-apply_crossfeed |
89 | 89 | ||
90 | /**************************************************************************** | 90 | /**************************************************************************** |
91 | * dsp_downsample(int channels, int count, struct resample_data *r, | 91 | * dsp_downsample(int channels, int count, struct resample_data *r, |
92 | * int32_t **src, int32_t **dst) | 92 | * int32_t **src, int32_t **dst) |
93 | */ | 93 | */ |
94 | .section .text | 94 | .section .text |
95 | .global dsp_downsample | 95 | .global dsp_downsample |
96 | dsp_downsample: | 96 | dsp_downsample: |
97 | lea.l -40(%sp), %sp | save non-clobberables | 97 | lea.l -40(%sp), %sp | save non-clobberables |
98 | movem.l %d2-%d7/%a2-%a5, (%sp) | | 98 | movem.l %d2-%d7/%a2-%a5, (%sp) | |
99 | movem.l 44(%sp), %d2-%d3/%a0-%a2| %d2 = ch = channels | 99 | movem.l 44(%sp), %d2-%d3/%a0-%a2| %d2 = ch = channels |
100 | | %d3 = count | 100 | | %d3 = count |
101 | | %a0 = r | 101 | | %a0 = r |
102 | | %a1 = src | 102 | | %a1 = src |
103 | | %a2 = dst | 103 | | %a2 = dst |
104 | move.l 4(%a0), %d4 | %d4 = delta = r->delta | 104 | move.l 4(%a0), %d4 | %d4 = delta = r->delta |
105 | move.l #16, %d7 | %d7 = shift | 105 | move.l #16, %d7 | %d7 = shift |
106 | .dschannel_loop: | 106 | .dschannel_loop: |
107 | move.l (%a0), %d5 | %d5 = phase = r->phase | 107 | move.l (%a0), %d5 | %d5 = phase = r->phase |
108 | move.l -4(%a1, %d2.l*4), %a3 | %a3 = s = src[ch-1] | 108 | move.l -4(%a1, %d2.l*4), %a3 | %a3 = s = src[ch-1] |
109 | move.l -4(%a2, %d2.l*4), %a4 | %a4 = d = dst[ch-1] | 109 | move.l -4(%a2, %d2.l*4), %a4 | %a4 = d = dst[ch-1] |
110 | lea.l 4(%a0, %d2.l*4), %a5 | %a5 = &r->last_sample[ch-1] | 110 | lea.l 4(%a0, %d2.l*4), %a5 | %a5 = &r->last_sample[ch-1] |
111 | move.l (%a5), %d0 | %d0 = last = r->last_sample[ch-1] | 111 | move.l (%a5), %d0 | %d0 = last = r->last_sample[ch-1] |
112 | move.l -4(%a3, %d3.l*4), %d1 | r->last_sample[ch-1] = s[count-1] | 112 | move.l -4(%a3, %d3.l*4), %d1 | r->last_sample[ch-1] = s[count-1] |
113 | move.l %d1, (%a5) | | 113 | move.l %d1, (%a5) | |
114 | move.l %d5, %d6 | %d6 = pos = phase >> 16 | 114 | move.l %d5, %d6 | %d6 = pos = phase >> 16 |
115 | lsr.l %d7, %d6 | | 115 | lsr.l %d7, %d6 | |
116 | cmp.l %d3, %d6 | past end of samples? | 116 | cmp.l %d3, %d6 | past end of samples? |
117 | bge.b .dsloop_skip | yes? skip loop | 117 | bge.b .dsloop_skip | yes? skip loop |
118 | tst.l %d6 | need last sample of prev. frame? | 118 | tst.l %d6 | need last sample of prev. frame? |
119 | bne.b .dsloop | no? start main loop | 119 | bne.b .dsloop | no? start main loop |
120 | move.l (%a3, %d6.l*4), %d1 | %d1 = s[pos] | 120 | move.l (%a3, %d6.l*4), %d1 | %d1 = s[pos] |
121 | bra.b .dsuse_last_start | start with last (last in %d0) | 121 | bra.b .dsuse_last_start | start with last (last in %d0) |
122 | .dsloop: | 122 | .dsloop: |
123 | lea.l -4(%a3, %d6.l*4), %a5 | load s[pos-1] and s[pos] | 123 | lea.l -4(%a3, %d6.l*4), %a5 | load s[pos-1] and s[pos] |
124 | movem.l (%a5), %d0-%d1 | | 124 | movem.l (%a5), %d0-%d1 | |
125 | .dsuse_last_start: | 125 | .dsuse_last_start: |
126 | sub.l %d0, %d1 | %d1 = diff = s[pos] - s[pos-1] | 126 | sub.l %d0, %d1 | %d1 = diff = s[pos] - s[pos-1] |
127 | move.l %d0, %acc0 | %acc0 = previous sample | 127 | move.l %d0, %acc0 | %acc0 = previous sample |
128 | move.l %d5, %d0 | frac = (phase << 16) >> 1 | 128 | move.l %d5, %d0 | frac = (phase << 16) >> 1 |
129 | lsl.l %d7, %d0 | | 129 | lsl.l %d7, %d0 | |
130 | lsr.l #1, %d0 | | 130 | lsr.l #1, %d0 | |
131 | mac.l %d0, %d1, %acc0 | %acc0 += frac * diff | 131 | mac.l %d0, %d1, %acc0 | %acc0 += frac * diff |
132 | move.l %acc0, %d0 | | 132 | move.l %acc0, %d0 | |
133 | add.l %d4, %d5 | phase += delta | 133 | add.l %d4, %d5 | phase += delta |
134 | move.l %d5, %d6 | pos = phase >> 16 | 134 | move.l %d5, %d6 | pos = phase >> 16 |
135 | lsr.l %d7, %d6 | | 135 | lsr.l %d7, %d6 | |
136 | move.l %d0, (%a4)+ | *d++ = %d0 | 136 | move.l %d0, (%a4)+ | *d++ = %d0 |
137 | cmp.l %d3, %d6 | pos < count? | 137 | cmp.l %d3, %d6 | pos < count? |
138 | blt.b .dsloop | yes? continue resampling | 138 | blt.b .dsloop | yes? continue resampling |
139 | .dsloop_skip: | 139 | .dsloop_skip: |
140 | subq.l #1, %d2 | ch > 0? | 140 | subq.l #1, %d2 | ch > 0? |
141 | bgt.b .dschannel_loop | yes? process next channel | 141 | bgt.b .dschannel_loop | yes? process next channel |
142 | asl.l %d7, %d3 | wrap phase to start of next frame | 142 | asl.l %d7, %d3 | wrap phase to start of next frame |
143 | sub.l %d3, %d5 | r->phase = phase - (count << 16) | 143 | sub.l %d3, %d5 | r->phase = phase - (count << 16) |
144 | move.l %d5, (%a0) | | 144 | move.l %d5, (%a0) | |
145 | move.l %a4, %d0 | return d - dst[0] | 145 | move.l %a4, %d0 | return d - dst[0] |
146 | sub.l (%a2), %d0 | | 146 | sub.l (%a2), %d0 | |
147 | asr.l #2, %d0 | convert bytes->samples | 147 | asr.l #2, %d0 | convert bytes->samples |
148 | movem.l (%sp), %d2-%d7/%a2-%a5 | restore non-clobberables | 148 | movem.l (%sp), %d2-%d7/%a2-%a5 | restore non-clobberables |
149 | move.l %acc1, %acc0 | clear %acc0 | 149 | move.l %acc1, %acc0 | clear %acc0 |
150 | lea.l 40(%sp), %sp | cleanup stack | 150 | lea.l 40(%sp), %sp | cleanup stack |
151 | rts | buh-bye | 151 | rts | buh-bye |
152 | .dsend: | 152 | .dsend: |
153 | .size dsp_downsample,.dsend-dsp_downsample | 153 | .size dsp_downsample,.dsend-dsp_downsample |
154 | 154 | ||
155 | /**************************************************************************** | 155 | /**************************************************************************** |
156 | * dsp_upsample(int channels, int count, struct resample_data *r, | 156 | * dsp_upsample(int channels, int count, struct resample_data *r, |
157 | * int32_t **src, int32_t **dst) | 157 | * int32_t **src, int32_t **dst) |
158 | */ | 158 | */ |
159 | .section .text | 159 | .section .text |
160 | .global dsp_upsample | 160 | .global dsp_upsample |
161 | dsp_upsample: | 161 | dsp_upsample: |
162 | lea.l -40(%sp), %sp | save non-clobberables | 162 | lea.l -40(%sp), %sp | save non-clobberables |
163 | movem.l %d2-%d7/%a2-%a5, (%sp) | | 163 | movem.l %d2-%d7/%a2-%a5, (%sp) | |
164 | movem.l 44(%sp), %d2-%d3/%a0-%a2| %d2 = ch = channels | 164 | movem.l 44(%sp), %d2-%d3/%a0-%a2| %d2 = ch = channels |
165 | | %d3 = count | 165 | | %d3 = count |
166 | | %a0 = r | 166 | | %a0 = r |
167 | | %a1 = src | 167 | | %a1 = src |
168 | | %a2 = dst | 168 | | %a2 = dst |
169 | move.l 4(%a0), %d4 | %d4 = delta = r->delta | 169 | move.l 4(%a0), %d4 | %d4 = delta = r->delta |
170 | swap %d4 | swap delta to high word to use | 170 | swap %d4 | swap delta to high word to use |
171 | | carries to increment position | 171 | | carries to increment position |
172 | .uschannel_loop: | 172 | .uschannel_loop: |
173 | move.l (%a0), %d5 | %d5 = phase = r->phase | 173 | move.l (%a0), %d5 | %d5 = phase = r->phase |
174 | move.l -4(%a1, %d2.l*4), %a3 | %a3 = s = src[ch-1] | 174 | move.l -4(%a1, %d2.l*4), %a3 | %a3 = s = src[ch-1] |
175 | move.l -4(%a2, %d2.l*4), %a4 | %a4 = d = dst[ch-1] | 175 | move.l -4(%a2, %d2.l*4), %a4 | %a4 = d = dst[ch-1] |
176 | lea.l 4(%a0, %d2.l*4), %a5 | %a5 = &r->last_sample[ch-1] | 176 | lea.l 4(%a0, %d2.l*4), %a5 | %a5 = &r->last_sample[ch-1] |
177 | move.l (%a5), %d0 | %d0 = last = r->last_sample[ch-1] | 177 | move.l (%a5), %d0 | %d0 = last = r->last_sample[ch-1] |
178 | move.l -4(%a3, %d3.l*4), %d1 | r->last_sample[ch-1] = s[count-1] | 178 | move.l -4(%a3, %d3.l*4), %d1 | r->last_sample[ch-1] = s[count-1] |
179 | move.l %d1, (%a5) | | 179 | move.l %d1, (%a5) | |
180 | moveq.l #16, %d1 | %d1 = shift | 180 | moveq.l #16, %d1 | %d1 = shift |
181 | move.l %d5, %d6 | %d6 = pos = phase >> 16 | 181 | move.l %d5, %d6 | %d6 = pos = phase >> 16 |
182 | lsl.l %d1, %d5 | swap phase to high word to use | 182 | lsl.l %d1, %d5 | swap phase to high word to use |
183 | | carries to increment position | 183 | | carries to increment position |
184 | lsr.l %d1, %d6 | pos == 0? | 184 | lsr.l %d1, %d6 | pos == 0? |
185 | bne.b .usstart_1 | no? transition from down | 185 | bne.b .usstart_1 | no? transition from down |
186 | move.l (%a3), %d1 | %d1 = s[0] | 186 | move.l (%a3), %d1 | %d1 = s[0] |
187 | sub.l %d0, %d1 | diff = s[pos] - last | 187 | sub.l %d0, %d1 | diff = s[pos] - last |
188 | bra.b .usloop_0 | jump to typical start point | 188 | bra.b .usloop_0 | jump to typical start point |
189 | .usstart_1: | 189 | .usstart_1: |
190 | cmp.l %d3, %d6 | past end of samples? | 190 | cmp.l %d3, %d6 | past end of samples? |
191 | bge.b .usloop_skip | yes? skip loop | 191 | bge.b .usloop_skip | yes? skip loop |
192 | .usloop_1: | 192 | .usloop_1: |
193 | lea.l -4(%a3, %d6.l*4), %a5 | load s[pos-1] and s[pos] | 193 | lea.l -4(%a3, %d6.l*4), %a5 | load s[pos-1] and s[pos] |
194 | movem.l (%a5), %d0-%d1 | | 194 | movem.l (%a5), %d0-%d1 | |
195 | sub.l %d0, %d1 | %d1 = diff = s[pos] - s[pos-1] | 195 | sub.l %d0, %d1 | %d1 = diff = s[pos] - s[pos-1] |
196 | .usloop_0: | 196 | .usloop_0: |
197 | move.l %d0, %acc0 | %acc0 = previous sample | 197 | move.l %d0, %acc0 | %acc0 = previous sample |
198 | lsr.l #1, %d5 | make phase into frac | 198 | lsr.l #1, %d5 | make phase into frac |
199 | mac.l %d1, %d5, %acc0 | %acc0 += diff * frac | 199 | mac.l %d1, %d5, %acc0 | %acc0 += diff * frac |
200 | move.l %acc0, %d7 | | 200 | move.l %acc0, %d7 | |
201 | lsl.l #1, %d5 | restore frac to phase | 201 | lsl.l #1, %d5 | restore frac to phase |
202 | move.l %d7, (%a4)+ | *d++ = %d7 | 202 | move.l %d7, (%a4)+ | *d++ = %d7 |
203 | add.l %d4, %d5 | phase += delta | 203 | add.l %d4, %d5 | phase += delta |
204 | bcc.b .usloop_0 | load next values? | 204 | bcc.b .usloop_0 | load next values? |
205 | addq.l #1, %d6 | increment position | 205 | addq.l #1, %d6 | increment position |
206 | cmp.l %d3, %d6 | pos < count? | 206 | cmp.l %d3, %d6 | pos < count? |
207 | blt.b .usloop_1 | yes? continue resampling | 207 | blt.b .usloop_1 | yes? continue resampling |
208 | .usloop_skip: | 208 | .usloop_skip: |
209 | subq.l #1, %d2 | ch > 0? | 209 | subq.l #1, %d2 | ch > 0? |
210 | bgt.b .uschannel_loop | yes? process next channel | 210 | bgt.b .uschannel_loop | yes? process next channel |
211 | swap %d5 | wrap phase to start of next frame | 211 | swap %d5 | wrap phase to start of next frame |
212 | move.l %d5, (%a0) | ...and save in r->phase | 212 | move.l %d5, (%a0) | ...and save in r->phase |
213 | move.l %a4, %d0 | return d - dst[0] | 213 | move.l %a4, %d0 | return d - dst[0] |
214 | sub.l (%a2), %d0 | | 214 | sub.l (%a2), %d0 | |
215 | asr.l #2, %d0 | convert bytes->samples | 215 | asr.l #2, %d0 | convert bytes->samples |
216 | movem.l (%sp), %d2-%d7/%a2-%a5 | restore non-clobberables | 216 | movem.l (%sp), %d2-%d7/%a2-%a5 | restore non-clobberables |
217 | move.l %acc1, %acc0 | clear %acc0 | 217 | move.l %acc1, %acc0 | clear %acc0 |
218 | lea.l 40(%sp), %sp | cleanup stack | 218 | lea.l 40(%sp), %sp | cleanup stack |
219 | rts | buh-bye | 219 | rts | buh-bye |
220 | .usend: | 220 | .usend: |
221 | .size dsp_upsample,.usend-dsp_upsample | 221 | .size dsp_upsample,.usend-dsp_upsample |