Go to the documentation of this file.
30 int dstStride,
int srcStride,
int h)
37 MMI_ULWC1(%[ftmp0], %[
src], 0x00)
38 MMI_SWC1(%[ftmp0], %[
dst], 0x00)
39 "addi %[h], %[h], -0x01 \n\t"
40 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
41 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
43 : [ftmp0]
"=&f"(ftmp[0]),
47 : [dstStride]
"r"((
mips_reg)dstStride),
54 int dstStride,
int srcStride,
int h)
61 MMI_ULDC1(%[ftmp0], %[
src], 0x00)
62 MMI_SDC1(%[ftmp0], %[
dst], 0x00)
63 "addi %[h], %[h], -0x01 \n\t"
64 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
65 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
67 : [ftmp0]
"=&f"(ftmp[0]),
71 : [dstStride]
"r"((
mips_reg)dstStride),
78 int dstStride,
int srcStride,
int h)
86 MMI_ULDC1(%[ftmp0], %[
src], 0x00)
87 "ldl %[tmp0], 0x0f(%[src]) \n\t"
88 "ldr %[tmp0], 0x08(%[src]) \n\t"
89 MMI_SDC1(%[ftmp0], %[
dst], 0x00)
90 "sdl %[tmp0], 0x0f(%[dst]) \n\t"
91 "sdr %[tmp0], 0x08(%[dst]) \n\t"
92 "addi %[h], %[h], -0x01 \n\t"
93 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
94 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
96 : [ftmp0]
"=&f"(ftmp[0]),
101 : [dstStride]
"r"((
mips_reg)dstStride),
107 #define op2_avg(a, b) a = (((a)+CLIP(((b) + 512)>>10)+1)>>1)
108 #define op2_put(a, b) a = CLIP(((b) + 512)>>10)
110 int dstStride,
int srcStride)
117 "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t"
118 "dli %[tmp0], 0x04 \n\t"
120 MMI_ULWC1(%[ftmp1], %[
src], -0x02)
121 MMI_ULWC1(%[ftmp2], %[
src], -0x01)
122 MMI_ULWC1(%[ftmp3], %[
src], 0x00)
123 MMI_ULWC1(%[ftmp4], %[
src], 0x01)
124 MMI_ULWC1(%[ftmp5], %[
src], 0x02)
125 MMI_ULWC1(%[ftmp6], %[
src], 0x03)
127 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
128 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp0] \n\t"
129 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp0] \n\t"
130 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp0] \n\t"
131 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp0] \n\t"
132 "punpcklbh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
133 "paddsh %[ftmp7], %[ftmp3], %[ftmp4] \n\t"
134 "paddsh %[ftmp8], %[ftmp2], %[ftmp5] \n\t"
135 "paddsh %[ftmp9], %[ftmp1], %[ftmp6] \n\t"
136 "pmullh %[ftmp7], %[ftmp7], %[ff_pw_20] \n\t"
137 "pmullh %[ftmp8], %[ftmp8], %[ff_pw_5] \n\t"
138 "psubsh %[ftmp7], %[ftmp7], %[ftmp8] \n\t"
139 "paddsh %[ftmp9], %[ftmp7], %[ftmp9] \n\t"
140 "paddsh %[ftmp9], %[ftmp9], %[ff_pw_16] \n\t"
141 "psrah %[ftmp9], %[ftmp9], %[ff_pw_5] \n\t"
142 "packushb %[ftmp9], %[ftmp9], %[ftmp0] \n\t"
143 MMI_SWC1(%[ftmp9], %[
dst], 0x00)
144 "daddi %[tmp0], %[tmp0], -0x01 \n\t"
145 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
146 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
147 "bnez %[tmp0], 1b \n\t"
148 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
149 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
150 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
151 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
152 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
156 : [dstStride]
"r"((
mips_reg)dstStride),
157 [srcStride]
"r"((
mips_reg)srcStride),
165 int dstStride,
int srcStride)
172 "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t"
173 "dli %[tmp0], 0x08 \n\t"
175 MMI_ULDC1(%[ftmp1], %[
src], -0x02)
176 MMI_ULDC1(%[ftmp2], %[
src], -0x01)
177 MMI_ULDC1(%[ftmp3], %[
src], 0x00)
178 MMI_ULDC1(%[ftmp4], %[
src], 0x01)
179 MMI_ULDC1(%[ftmp5], %[
src], 0x02)
180 MMI_ULDC1(%[ftmp6], %[
src], 0x03)
181 "punpcklbh %[ftmp7], %[ftmp3], %[ftmp0] \n\t"
182 "punpckhbh %[ftmp8], %[ftmp3], %[ftmp0] \n\t"
183 "punpcklbh %[ftmp9], %[ftmp4], %[ftmp0] \n\t"
184 "punpckhbh %[ftmp10], %[ftmp4], %[ftmp0] \n\t"
185 "paddsh %[ftmp3], %[ftmp7], %[ftmp9] \n\t"
186 "paddsh %[ftmp4], %[ftmp8], %[ftmp10] \n\t"
187 "pmullh %[ftmp3], %[ftmp3], %[ff_pw_20] \n\t"
188 "pmullh %[ftmp4], %[ftmp4], %[ff_pw_20] \n\t"
189 "punpcklbh %[ftmp7], %[ftmp2], %[ftmp0] \n\t"
190 "punpckhbh %[ftmp8], %[ftmp2], %[ftmp0] \n\t"
191 "punpcklbh %[ftmp9], %[ftmp5], %[ftmp0] \n\t"
192 "punpckhbh %[ftmp10], %[ftmp5], %[ftmp0] \n\t"
193 "paddsh %[ftmp2], %[ftmp7], %[ftmp9] \n\t"
194 "paddsh %[ftmp5], %[ftmp8], %[ftmp10] \n\t"
195 "pmullh %[ftmp2], %[ftmp2], %[ff_pw_5] \n\t"
196 "pmullh %[ftmp5], %[ftmp5], %[ff_pw_5] \n\t"
197 "punpcklbh %[ftmp7], %[ftmp1], %[ftmp0] \n\t"
198 "punpckhbh %[ftmp8], %[ftmp1], %[ftmp0] \n\t"
199 "punpcklbh %[ftmp9], %[ftmp6], %[ftmp0] \n\t"
200 "punpckhbh %[ftmp10], %[ftmp6], %[ftmp0] \n\t"
201 "paddsh %[ftmp1], %[ftmp7], %[ftmp9] \n\t"
202 "paddsh %[ftmp6], %[ftmp8], %[ftmp10] \n\t"
203 "psubsh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
204 "psubsh %[ftmp4], %[ftmp4], %[ftmp5] \n\t"
205 "paddsh %[ftmp3], %[ftmp3], %[ftmp1] \n\t"
206 "paddsh %[ftmp4], %[ftmp4], %[ftmp6] \n\t"
207 "paddsh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
208 "paddsh %[ftmp4], %[ftmp4], %[ff_pw_16] \n\t"
209 "psrah %[ftmp3], %[ftmp3], %[ff_pw_5] \n\t"
210 "psrah %[ftmp4], %[ftmp4], %[ff_pw_5] \n\t"
211 "packushb %[ftmp9], %[ftmp3], %[ftmp4] \n\t"
212 MMI_SDC1(%[ftmp9], %[
dst], 0x00)
213 "daddi %[tmp0], %[tmp0], -0x01 \n\t"
214 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
215 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
216 "bnez %[tmp0], 1b \n\t"
217 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
218 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
219 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
220 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
221 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
222 [ftmp10]
"=&f"(ftmp[10]),
226 : [dstStride]
"r"((
mips_reg)dstStride),
227 [srcStride]
"r"((
mips_reg)srcStride),
235 int dstStride,
int srcStride)
246 int dstStride,
int srcStride)
253 "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t"
254 "dli %[tmp0], 0x04 \n\t"
256 MMI_ULWC1(%[ftmp1], %[
src], -0x02)
257 MMI_ULWC1(%[ftmp2], %[
src], -0x01)
258 MMI_ULWC1(%[ftmp3], %[
src], 0x00)
259 MMI_ULWC1(%[ftmp4], %[
src], 0x01)
260 MMI_ULWC1(%[ftmp5], %[
src], 0x02)
261 MMI_ULWC1(%[ftmp6], %[
src], 0x03)
262 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
263 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp0] \n\t"
264 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp0] \n\t"
265 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp0] \n\t"
266 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp0] \n\t"
267 "punpcklbh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
268 "paddsh %[ftmp7], %[ftmp3], %[ftmp4] \n\t"
269 "paddsh %[ftmp8], %[ftmp2], %[ftmp5] \n\t"
270 "paddsh %[ftmp9], %[ftmp1], %[ftmp6] \n\t"
271 "pmullh %[ftmp7], %[ftmp7], %[ff_pw_20] \n\t"
272 "pmullh %[ftmp8], %[ftmp8], %[ff_pw_5] \n\t"
273 "psubsh %[ftmp7], %[ftmp7], %[ftmp8] \n\t"
274 "paddsh %[ftmp9], %[ftmp7], %[ftmp9] \n\t"
275 "paddsh %[ftmp9], %[ftmp9], %[ff_pw_16] \n\t"
276 "psrah %[ftmp9], %[ftmp9], %[ff_pw_5] \n\t"
277 "packushb %[ftmp9], %[ftmp9], %[ftmp0] \n\t"
278 MMI_LWC1(%[ftmp10], %[
dst], 0x00)
279 "pavgb %[ftmp9], %[ftmp9], %[ftmp10] \n\t"
280 MMI_SWC1(%[ftmp9], %[
dst], 0x00)
281 "daddi %[tmp0], %[tmp0], -0x01 \n\t"
282 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
283 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
284 "bnez %[tmp0], 1b \n\t"
285 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
286 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
287 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
288 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
289 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
290 [ftmp10]
"=&f"(ftmp[10]),
294 : [dstStride]
"r"((
mips_reg)dstStride),
295 [srcStride]
"r"((
mips_reg)srcStride),
303 int dstStride,
int srcStride)
310 "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t"
311 "dli %[tmp0], 0x08 \n\t"
313 MMI_ULDC1(%[ftmp1], %[
src], -0x02)
314 MMI_ULDC1(%[ftmp2], %[
src], -0x01)
315 MMI_ULDC1(%[ftmp3], %[
src], 0x00)
316 MMI_ULDC1(%[ftmp4], %[
src], 0x01)
317 MMI_ULDC1(%[ftmp5], %[
src], 0x02)
318 MMI_ULDC1(%[ftmp6], %[
src], 0x03)
319 "punpcklbh %[ftmp7], %[ftmp3], %[ftmp0] \n\t"
320 "punpckhbh %[ftmp8], %[ftmp3], %[ftmp0] \n\t"
321 "punpcklbh %[ftmp9], %[ftmp4], %[ftmp0] \n\t"
322 "punpckhbh %[ftmp10], %[ftmp4], %[ftmp0] \n\t"
323 "paddsh %[ftmp3], %[ftmp7], %[ftmp9] \n\t"
324 "paddsh %[ftmp4], %[ftmp8], %[ftmp10] \n\t"
325 "pmullh %[ftmp3], %[ftmp3], %[ff_pw_20] \n\t"
326 "pmullh %[ftmp4], %[ftmp4], %[ff_pw_20] \n\t"
327 "punpcklbh %[ftmp7], %[ftmp2], %[ftmp0] \n\t"
328 "punpckhbh %[ftmp8], %[ftmp2], %[ftmp0] \n\t"
329 "punpcklbh %[ftmp9], %[ftmp5], %[ftmp0] \n\t"
330 "punpckhbh %[ftmp10], %[ftmp5], %[ftmp0] \n\t"
331 "paddsh %[ftmp2], %[ftmp7], %[ftmp9] \n\t"
332 "paddsh %[ftmp5], %[ftmp8], %[ftmp10] \n\t"
333 "pmullh %[ftmp2], %[ftmp2], %[ff_pw_5] \n\t"
334 "pmullh %[ftmp5], %[ftmp5], %[ff_pw_5] \n\t"
335 "punpcklbh %[ftmp7], %[ftmp1], %[ftmp0] \n\t"
336 "punpckhbh %[ftmp8], %[ftmp1], %[ftmp0] \n\t"
337 "punpcklbh %[ftmp9], %[ftmp6], %[ftmp0] \n\t"
338 "punpckhbh %[ftmp10], %[ftmp6], %[ftmp0] \n\t"
339 "paddsh %[ftmp1], %[ftmp7], %[ftmp9] \n\t"
340 "paddsh %[ftmp6], %[ftmp8], %[ftmp10] \n\t"
341 "psubsh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
342 "psubsh %[ftmp4], %[ftmp4], %[ftmp5] \n\t"
343 "paddsh %[ftmp3], %[ftmp3], %[ftmp1] \n\t"
344 "paddsh %[ftmp4], %[ftmp4], %[ftmp6] \n\t"
345 "paddsh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
346 "paddsh %[ftmp4], %[ftmp4], %[ff_pw_16] \n\t"
347 "psrah %[ftmp3], %[ftmp3], %[ff_pw_5] \n\t"
348 "psrah %[ftmp4], %[ftmp4], %[ff_pw_5] \n\t"
349 "packushb %[ftmp9], %[ftmp3], %[ftmp4] \n\t"
350 MMI_LDC1(%[ftmp10], %[
dst], 0x00)
351 "pavgb %[ftmp9], %[ftmp9], %[ftmp10] \n\t"
352 MMI_SDC1(%[ftmp9], %[
dst], 0x00)
353 "daddi %[tmp0], %[tmp0], -0x01 \n\t"
354 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
355 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
356 "bnez %[tmp0], 1b \n\t"
357 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
358 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
359 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
360 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
361 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
362 [ftmp10]
"=&f"(ftmp[10]),
366 : [dstStride]
"r"((
mips_reg)dstStride),
367 [srcStride]
"r"((
mips_reg)srcStride),
375 int dstStride,
int srcStride)
386 int dstStride,
int srcStride)
392 src -= 2 * srcStride;
396 ".set noreorder \n\t"
397 "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t"
398 "dli %[tmp0], 0x02 \n\t"
399 MMI_LWC1(%[ftmp1], %[
src], 0x00)
400 "mtc1 %[tmp0], %[ftmp10] \n\t"
401 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
402 "dli %[tmp0], 0x05 \n\t"
403 MMI_LWC1(%[ftmp2], %[
src], 0x00)
404 "mtc1 %[tmp0], %[ftmp11] \n\t"
405 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
406 MMI_LWC1(%[ftmp3], %[
src], 0x00)
407 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
408 MMI_LWC1(%[ftmp4], %[
src], 0x00)
409 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
410 MMI_LWC1(%[ftmp5], %[
src], 0x00)
411 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
412 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
413 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp0] \n\t"
414 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp0] \n\t"
415 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp0] \n\t"
416 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp0] \n\t"
417 MMI_LWC1(%[ftmp6], %[
src], 0x00)
418 "paddh %[ftmp7], %[ftmp3], %[ftmp4] \n\t"
419 "psllh %[ftmp7], %[ftmp7], %[ftmp10] \n\t"
420 "psubh %[ftmp7], %[ftmp7], %[ftmp2] \n\t"
421 "psubh %[ftmp7], %[ftmp7], %[ftmp5] \n\t"
422 "punpcklbh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
423 "pmullh %[ftmp7], %[ftmp7], %[ff_pw_5] \n\t"
424 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
425 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
426 "paddh %[ftmp1], %[ftmp1], %[ftmp6] \n\t"
427 "paddh %[ftmp7], %[ftmp7], %[ftmp1] \n\t"
428 "psrah %[ftmp7], %[ftmp7], %[ftmp11] \n\t"
429 "packushb %[ftmp7], %[ftmp7], %[ftmp7] \n\t"
430 MMI_SWC1(%[ftmp7], %[
dst], 0x00)
431 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
432 MMI_LWC1(%[ftmp1], %[
src], 0x00)
433 "paddh %[ftmp7], %[ftmp4], %[ftmp5] \n\t"
434 "psllh %[ftmp7], %[ftmp7], %[ftmp10] \n\t"
435 "psubh %[ftmp7], %[ftmp7], %[ftmp3] \n\t"
436 "psubh %[ftmp7], %[ftmp7], %[ftmp6] \n\t"
437 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
438 "pmullh %[ftmp7], %[ftmp7], %[ff_pw_5] \n\t"
439 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
440 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
441 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
442 "paddh %[ftmp7], %[ftmp7], %[ftmp2] \n\t"
443 "psrah %[ftmp7], %[ftmp7], %[ftmp11] \n\t"
444 "packushb %[ftmp7], %[ftmp7], %[ftmp7] \n\t"
445 MMI_SWC1(%[ftmp7], %[
dst], 0x00)
446 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
447 MMI_LWC1(%[ftmp2], %[
src], 0x00)
448 "paddh %[ftmp7], %[ftmp5], %[ftmp6] \n\t"
449 "psllh %[ftmp7], %[ftmp7], %[ftmp10] \n\t"
450 "psubh %[ftmp7], %[ftmp7], %[ftmp4] \n\t"
451 "psubh %[ftmp7], %[ftmp7], %[ftmp1] \n\t"
452 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp0] \n\t"
453 "pmullh %[ftmp7], %[ftmp7], %[ff_pw_5] \n\t"
454 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
455 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
456 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
457 "paddh %[ftmp7], %[ftmp7], %[ftmp3] \n\t"
458 "psrah %[ftmp7], %[ftmp7], %[ftmp11] \n\t"
459 "packushb %[ftmp7], %[ftmp7], %[ftmp7] \n\t"
460 MMI_SWC1(%[ftmp7], %[
dst], 0x00)
461 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
462 MMI_LWC1(%[ftmp3], %[
src], 0x00)
463 "paddh %[ftmp7], %[ftmp6], %[ftmp1] \n\t"
464 "psllh %[ftmp7], %[ftmp7], %[ftmp10] \n\t"
465 "psubh %[ftmp7], %[ftmp7], %[ftmp5] \n\t"
466 "psubh %[ftmp7], %[ftmp7], %[ftmp2] \n\t"
467 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp0] \n\t"
468 "pmullh %[ftmp7], %[ftmp7], %[ff_pw_5] \n\t"
469 "paddh %[ftmp4], %[ftmp4], %[ff_pw_16] \n\t"
470 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
471 "paddh %[ftmp4], %[ftmp4], %[ftmp3] \n\t"
472 "paddh %[ftmp7], %[ftmp7], %[ftmp4] \n\t"
473 "psrah %[ftmp7], %[ftmp7], %[ftmp11] \n\t"
474 "packushb %[ftmp7], %[ftmp7], %[ftmp7] \n\t"
475 MMI_SWC1(%[ftmp7], %[
dst], 0x00)
476 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
478 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
479 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
480 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
481 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
482 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
483 [ftmp10]
"=&f"(ftmp[10]), [ftmp11]
"=&f"(ftmp[11]),
487 : [dstStride]
"r"((
mips_reg)dstStride),
488 [srcStride]
"r"((
mips_reg)srcStride),
495 int dstStride,
int srcStride)
503 src -= 2 * srcStride;
508 ".set noreorder \n\t"
509 "dli %[tmp0], 0x02 \n\t"
510 MMI_LWC1(%[ftmp0], %[
src], 0x00)
511 "mtc1 %[tmp0], %[ftmp8] \n\t"
512 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
513 "dli %[tmp0], 0x05 \n\t"
514 MMI_LWC1(%[ftmp1], %[
src], 0x00)
515 "mtc1 %[tmp0], %[ftmp9] \n\t"
516 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
517 MMI_LWC1(%[ftmp2], %[
src], 0x00)
518 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
519 "pxor %[ftmp7], %[ftmp7], %[ftmp7] \n\t"
520 MMI_LWC1(%[ftmp3], %[
src], 0x00)
521 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
522 MMI_LWC1(%[ftmp4], %[
src], 0x00)
523 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
524 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
525 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp7] \n\t"
526 MMI_LWC1(%[ftmp5], %[
src], 0x00)
527 "paddh %[ftmp6], %[ftmp2], %[ftmp3] \n\t"
528 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
529 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
530 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
531 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
532 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
533 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
534 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
535 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
536 "paddh %[ftmp0], %[ftmp0], %[ff_pw_16] \n\t"
537 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
538 "paddh %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
539 "paddh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
540 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
541 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
542 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
543 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
544 MMI_LWC1(%[ftmp0], %[
src], 0x00)
545 "paddh %[ftmp6], %[ftmp3], %[ftmp4] \n\t"
546 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
547 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
548 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
549 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
550 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
551 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
552 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
553 "paddh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
554 "paddh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
555 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
556 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
557 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
558 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
559 "paddh %[ftmp6], %[ftmp4], %[ftmp5] \n\t"
560 MMI_LWC1(%[ftmp1], %[
src], 0x00)
561 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
562 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
563 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
564 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
565 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
566 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
567 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
568 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
569 "paddh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
570 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
571 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
572 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
573 "paddh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
574 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
575 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
576 MMI_LWC1(%[ftmp2], %[
src], 0x00)
577 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
578 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
579 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
580 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
581 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
582 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
583 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
584 "paddh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
585 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
586 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
587 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
588 "paddh %[ftmp6], %[ftmp0], %[ftmp1] \n\t"
589 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
590 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
591 MMI_LWC1(%[ftmp3], %[
src], 0x00)
592 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
593 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
594 "punpcklbh %[ftmp3] , %[ftmp3], %[ftmp7] \n\t"
595 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
596 "paddh %[ftmp4], %[ftmp4], %[ff_pw_16] \n\t"
597 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
598 "paddh %[ftmp4], %[ftmp4], %[ftmp3] \n\t"
599 "paddh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
600 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
601 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
602 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
603 "paddh %[ftmp6], %[ftmp1], %[ftmp2] \n\t"
604 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
605 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
606 MMI_LWC1(%[ftmp4], %[
src], 0x00)
607 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
608 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
609 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
610 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
611 "paddh %[ftmp5], %[ftmp5], %[ff_pw_16] \n\t"
612 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
613 "paddh %[ftmp5], %[ftmp5], %[ftmp4] \n\t"
614 "paddh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
615 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
616 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
617 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
618 "paddh %[ftmp6], %[ftmp2], %[ftmp3] \n\t"
619 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
620 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
621 MMI_LWC1(%[ftmp5], %[
src], 0x00)
622 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
623 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
624 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
625 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
626 "paddh %[ftmp0], %[ftmp0], %[ff_pw_16] \n\t"
627 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
628 "paddh %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
629 "paddh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
630 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
631 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
632 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
633 "paddh %[ftmp6], %[ftmp3], %[ftmp4] \n\t"
634 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
635 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
636 MMI_LWC1(%[ftmp0], %[
src], 0x00)
637 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
638 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
639 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
640 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
641 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
642 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
643 "paddh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
644 "paddh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
645 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
646 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
647 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
648 "bne %[h], 0x10, 2f \n\t"
649 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
650 "paddh %[ftmp6], %[ftmp4], %[ftmp5] \n\t"
651 MMI_LWC1(%[ftmp1], %[
src], 0x00)
652 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
653 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
654 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
655 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
656 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
657 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
658 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
659 "paddh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
660 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
661 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
662 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
663 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
664 "paddh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
665 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
666 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
667 MMI_LWC1(%[ftmp2], %[
src], 0x00)
668 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
669 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
670 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
671 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
672 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
673 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
674 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
675 "paddh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
676 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
677 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
678 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
679 "paddh %[ftmp6], %[ftmp0], %[ftmp1] \n\t"
680 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
681 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
682 MMI_LWC1(%[ftmp3], %[
src], 0x00)
683 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
684 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
685 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp7] \n\t"
686 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
687 "paddh %[ftmp4], %[ftmp4], %[ff_pw_16] \n\t"
688 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
689 "paddh %[ftmp4], %[ftmp4], %[ftmp3] \n\t"
690 "paddh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
691 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
692 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
693 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
694 "paddh %[ftmp6], %[ftmp1], %[ftmp2] \n\t"
695 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
696 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
697 MMI_LWC1(%[ftmp4], %[
src], 0x00)
698 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
699 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
700 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
701 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
702 "paddh %[ftmp5], %[ftmp5], %[ff_pw_16] \n\t"
703 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
704 "paddh %[ftmp5], %[ftmp5], %[ftmp4] \n\t"
705 "paddh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
706 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
707 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
708 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
709 "paddh %[ftmp6], %[ftmp2], %[ftmp3] \n\t"
710 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
711 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
712 MMI_LWC1(%[ftmp5], %[
src], 0x00)
713 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
714 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
715 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
716 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
717 "paddh %[ftmp0], %[ftmp0], %[ff_pw_16] \n\t"
718 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
719 "paddh %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
720 "paddh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
721 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
722 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
723 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
724 "paddh %[ftmp6], %[ftmp3], %[ftmp4] \n\t"
725 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
726 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
727 MMI_LWC1(%[ftmp0], %[
src], 0x00)
728 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
729 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
730 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
731 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
732 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
733 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
734 "paddh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
735 "paddh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
736 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
737 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
738 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
739 "paddh %[ftmp6], %[ftmp4], %[ftmp5] \n\t"
740 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
741 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
742 MMI_LWC1(%[ftmp1], %[
src], 0x00)
743 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
744 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
745 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
746 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
747 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
748 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
749 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
750 "paddh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
751 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
752 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
753 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
754 "paddh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
755 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
756 "psllh %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
757 MMI_LWC1(%[ftmp2], %[
src], 0x00)
758 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
759 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
760 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
761 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
762 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
763 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
764 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
765 "paddh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
766 "psrah %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
767 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
768 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
769 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
772 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
773 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
774 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
775 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
776 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
781 : [dstStride]
"r"((
mips_reg)dstStride),
782 [srcStride]
"r"((
mips_reg)srcStride),
787 src += 4 - (
h + 5) * srcStride;
788 dst += 4 -
h * dstStride;
793 int dstStride,
int srcStride)
804 int dstStride,
int srcStride)
809 src -= 2 * srcStride;
813 ".set noreorder \n\t"
814 "dli %[tmp0], 0x02 \n\t"
815 "pxor %[ftmp7], %[ftmp7], %[ftmp7] \n\t"
816 "mtc1 %[tmp0], %[ftmp9] \n\t"
817 "dli %[tmp0], 0x05 \n\t"
818 MMI_LWC1(%[ftmp0], %[
src], 0x00)
819 "mtc1 %[tmp0], %[ftmp8] \n\t"
820 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
821 MMI_LWC1(%[ftmp1], %[
src], 0x00)
822 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
823 MMI_LWC1(%[ftmp2], %[
src], 0x00)
824 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
825 MMI_LWC1(%[ftmp3], %[
src], 0x00)
826 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
827 MMI_LWC1(%[ftmp4], %[
src], 0x00)
828 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
829 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
830 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
831 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
832 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp7] \n\t"
833 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
834 MMI_LWC1(%[ftmp5], %[
src], 0x00)
835 "paddh %[ftmp6], %[ftmp2], %[ftmp3] \n\t"
836 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
837 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
838 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
839 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
840 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
841 "paddh %[ftmp0], %[ftmp0], %[ff_pw_16] \n\t"
842 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
843 "paddh %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
844 "paddh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
845 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
846 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
847 MMI_LWC1(%[ftmp0], %[
dst], 0x00)
848 "pavgb %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
849 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
850 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
851 MMI_LWC1(%[ftmp0], %[
src], 0x00)
852 "paddh %[ftmp6], %[ftmp3], %[ftmp4] \n\t"
853 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
854 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
855 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
856 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
857 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
858 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
859 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
860 "paddh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
861 "paddh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
862 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
863 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
864 MMI_LWC1(%[ftmp1], %[
dst], 0x00)
865 "pavgb %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
866 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
867 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
868 MMI_LWC1(%[ftmp1], %[
src], 0x00)
869 "paddh %[ftmp6], %[ftmp4], %[ftmp5] \n\t"
870 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
871 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
872 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
873 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
874 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
875 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
876 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
877 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
878 "paddh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
879 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
880 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
881 MMI_LWC1(%[ftmp2], %[
dst], 0x00)
882 "pavgb %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
883 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
884 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
885 MMI_LWC1(%[ftmp2], %[
src], 0x00)
886 "paddh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
887 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
888 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
889 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
890 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
891 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
892 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
893 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
894 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
895 "paddh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
896 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
897 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
898 MMI_LWC1(%[ftmp3], %[
dst], 0x00)
899 "pavgb %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
900 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
901 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
903 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
904 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
905 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
906 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
907 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
910 : [dstStride]
"r"((
mips_reg)dstStride),
911 [srcStride]
"r"((
mips_reg)srcStride),
918 int dstStride,
int srcStride)
926 src -= 2 * srcStride;
931 ".set noreorder \n\t"
932 "dli %[tmp0], 0x02 \n\t"
933 "pxor %[ftmp7], %[ftmp7], %[ftmp7] \n\t"
934 "mtc1 %[tmp0], %[ftmp9] \n\t"
935 "dli %[tmp0], 0x05 \n\t"
936 MMI_LWC1(%[ftmp0], %[
src], 0x00)
937 "mtc1 %[tmp0], %[ftmp8] \n\t"
938 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
939 MMI_LWC1(%[ftmp1], %[
src], 0x00)
940 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
941 MMI_LWC1(%[ftmp2], %[
src], 0x00)
942 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
943 MMI_LWC1(%[ftmp3], %[
src], 0x00)
944 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
945 MMI_LWC1(%[ftmp4], %[
src], 0x00)
946 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
947 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
948 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
949 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
950 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp7] \n\t"
951 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
952 MMI_LWC1(%[ftmp5], %[
src], 0x00)
953 "paddh %[ftmp6], %[ftmp2], %[ftmp3] \n\t"
954 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
955 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
956 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
957 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
958 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
959 "paddh %[ftmp0], %[ftmp0], %[ff_pw_16] \n\t"
960 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
961 "paddh %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
962 "paddh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
963 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
964 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
965 MMI_LWC1(%[ftmp0], %[
dst], 0x00)
966 "pavgb %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
967 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
968 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
969 MMI_LWC1(%[ftmp0], %[
src], 0x00)
970 "paddh %[ftmp6], %[ftmp3], %[ftmp4] \n\t"
971 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
972 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
973 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
974 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
975 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
976 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
977 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
978 "paddh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
979 "paddh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
980 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
981 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
982 MMI_LWC1(%[ftmp1], %[
dst], 0x00)
983 "pavgb %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
984 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
985 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
986 MMI_LWC1(%[ftmp1], %[
src], 0x00)
987 "paddh %[ftmp6], %[ftmp4], %[ftmp5] \n\t"
988 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
989 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
990 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
991 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
992 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
993 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
994 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
995 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
996 "paddh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
997 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
998 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
999 MMI_LWC1(%[ftmp2], %[
dst], 0x00)
1000 "pavgb %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1001 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1002 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1003 MMI_LWC1(%[ftmp2], %[
src], 0x00)
1004 "paddh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
1005 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1006 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1007 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1008 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
1009 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1010 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
1011 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1012 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
1013 "paddh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1014 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1015 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1016 MMI_LWC1(%[ftmp3], %[
dst], 0x00)
1017 "pavgb %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1018 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1019 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1020 MMI_LWC1(%[ftmp3], %[
src], 0x00)
1021 "paddh %[ftmp6], %[ftmp0], %[ftmp1] \n\t"
1022 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1023 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1024 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1025 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp7] \n\t"
1026 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1027 "paddh %[ftmp4], %[ftmp4], %[ff_pw_16] \n\t"
1028 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1029 "paddh %[ftmp4], %[ftmp4], %[ftmp3] \n\t"
1030 "paddh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1031 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1032 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1033 MMI_LWC1(%[ftmp4], %[
dst], 0x00)
1034 "pavgb %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1035 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1036 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1037 MMI_LWC1(%[ftmp4], %[
src], 0x00)
1038 "paddh %[ftmp6], %[ftmp1], %[ftmp2] \n\t"
1039 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1040 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1041 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1042 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
1043 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1044 "paddh %[ftmp5], %[ftmp5], %[ff_pw_16] \n\t"
1045 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1046 "paddh %[ftmp5], %[ftmp5], %[ftmp4] \n\t"
1047 "paddh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1048 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1049 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1050 MMI_LWC1(%[ftmp5], %[
dst], 0x00)
1051 "pavgb %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1052 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1053 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1054 MMI_LWC1(%[ftmp5], %[
src], 0x00)
1055 "paddh %[ftmp6], %[ftmp2], %[ftmp3] \n\t"
1056 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1057 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1058 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1059 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
1060 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1061 "paddh %[ftmp0], %[ftmp0], %[ff_pw_16] \n\t"
1062 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1063 "paddh %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
1064 "paddh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1065 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1066 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1067 MMI_LWC1(%[ftmp0], %[
dst], 0x00)
1068 "pavgb %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1069 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1070 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1071 MMI_LWC1(%[ftmp0], %[
src], 0x00)
1072 "paddh %[ftmp6], %[ftmp3], %[ftmp4] \n\t"
1073 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1074 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1075 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1076 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
1077 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1078 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
1079 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1080 "paddh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
1081 "paddh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1082 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1083 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1084 MMI_LWC1(%[ftmp1], %[
dst], 0x00)
1085 "pavgb %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1086 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1087 "bne %[h], 0x10, 2f \n\t"
1088 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1089 MMI_LWC1(%[ftmp1], %[
src], 0x00)
1090 "paddh %[ftmp6], %[ftmp4], %[ftmp5] \n\t"
1091 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1092 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1093 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1094 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
1095 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1096 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
1097 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1098 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
1099 "paddh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1100 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1101 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1102 MMI_LWC1(%[ftmp2], %[
dst], 0x00)
1103 "pavgb %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1104 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1105 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1106 MMI_LWC1(%[ftmp2], %[
src], 0x00)
1107 "paddh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
1108 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1109 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1110 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1111 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
1112 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1113 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
1114 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1115 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
1116 "paddh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1117 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1118 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1119 MMI_LWC1(%[ftmp3], %[
dst], 0x00)
1120 "pavgb %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1121 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1122 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1123 MMI_LWC1(%[ftmp3], %[
src], 0x00)
1124 "paddh %[ftmp6], %[ftmp0], %[ftmp1] \n\t"
1125 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1126 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1127 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1128 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp7] \n\t"
1129 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1130 "paddh %[ftmp4], %[ftmp4], %[ff_pw_16] \n\t"
1131 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1132 "paddh %[ftmp4], %[ftmp4], %[ftmp3] \n\t"
1133 "paddh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1134 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1135 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1136 MMI_LWC1(%[ftmp4], %[
dst], 0x00)
1137 "pavgb %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1138 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1139 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1140 MMI_LWC1(%[ftmp4], %[
src], 0x00)
1141 "paddh %[ftmp6], %[ftmp1], %[ftmp2] \n\t"
1142 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1143 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1144 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1145 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
1146 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1147 "paddh %[ftmp5], %[ftmp5], %[ff_pw_16] \n\t"
1148 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1149 "paddh %[ftmp5], %[ftmp5], %[ftmp4] \n\t"
1150 "paddh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1151 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1152 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1153 MMI_LWC1(%[ftmp5], %[
dst], 0x00)
1154 "pavgb %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1155 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1156 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1157 MMI_LWC1(%[ftmp5], %[
src], 0x00)
1158 "paddh %[ftmp6], %[ftmp2], %[ftmp3] \n\t"
1159 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1160 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1161 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1162 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
1163 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1164 "paddh %[ftmp0], %[ftmp0], %[ff_pw_16] \n\t"
1165 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1166 "paddh %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
1167 "paddh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1168 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1169 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1170 MMI_LWC1(%[ftmp0], %[
dst], 0x00)
1171 "pavgb %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1172 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1173 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1174 MMI_LWC1(%[ftmp0], %[
src], 0x00)
1175 "paddh %[ftmp6], %[ftmp3], %[ftmp4] \n\t"
1176 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1177 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1178 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1179 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
1180 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1181 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
1182 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1183 "paddh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
1184 "paddh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1185 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1186 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1187 MMI_LWC1(%[ftmp1], %[
dst], 0x00)
1188 "pavgb %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1189 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1190 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1191 MMI_LWC1(%[ftmp1], %[
src], 0x00)
1192 "paddh %[ftmp6], %[ftmp4], %[ftmp5] \n\t"
1193 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1194 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1195 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1196 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
1197 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1198 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
1199 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1200 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
1201 "paddh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1202 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1203 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1204 MMI_LWC1(%[ftmp2], %[
dst], 0x00)
1205 "pavgb %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1206 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1207 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1208 MMI_LWC1(%[ftmp2], %[
src], 0x00)
1209 "paddh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
1210 "psllh %[ftmp6], %[ftmp6], %[ftmp9] \n\t"
1211 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1212 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1213 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
1214 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1215 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
1216 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1217 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
1218 "paddh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1219 "psrah %[ftmp6], %[ftmp6], %[ftmp8] \n\t"
1220 "packushb %[ftmp6], %[ftmp6], %[ftmp6] \n\t"
1221 MMI_LWC1(%[ftmp3], %[
dst], 0x00)
1222 "pavgb %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1223 MMI_SWC1(%[ftmp6], %[
dst], 0x00)
1224 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1227 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
1228 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
1229 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
1230 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
1231 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
1232 [tmp0]
"=&r"(
tmp[0]),
1236 : [dstStride]
"r"((
mips_reg)dstStride),
1237 [srcStride]
"r"((
mips_reg)srcStride),
1242 src += 4 - (
h + 5) * srcStride;
1243 dst += 4 -
h * dstStride;
1248 int dstStride,
int srcStride)
1259 int dstStride,
int srcStride)
1263 int16_t *
tmp = _tmp;
1271 "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t"
1272 "dli %[tmp0], 0x09 \n\t"
1274 MMI_ULWC1(%[ftmp1], %[
src], -0x02)
1275 MMI_ULWC1(%[ftmp2], %[
src], -0x01)
1276 MMI_ULWC1(%[ftmp3], %[
src], 0x00)
1277 MMI_ULWC1(%[ftmp4], %[
src], 0x01)
1278 MMI_ULWC1(%[ftmp5], %[
src], 0x02)
1279 MMI_ULWC1(%[ftmp6], %[
src], 0x03)
1280 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
1281 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp0] \n\t"
1282 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp0] \n\t"
1283 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp0] \n\t"
1284 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp0] \n\t"
1285 "punpcklbh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1286 "paddsh %[ftmp7], %[ftmp3], %[ftmp4] \n\t"
1287 "paddsh %[ftmp8], %[ftmp2], %[ftmp5] \n\t"
1288 "paddsh %[ftmp9], %[ftmp1], %[ftmp6] \n\t"
1289 "pmullh %[ftmp7], %[ftmp7], %[ff_pw_20] \n\t"
1290 "pmullh %[ftmp8], %[ftmp8], %[ff_pw_5] \n\t"
1291 "psubsh %[ftmp7], %[ftmp7], %[ftmp8] \n\t"
1292 "paddsh %[ftmp9], %[ftmp7], %[ftmp9] \n\t"
1293 MMI_SDC1(%[ftmp9], %[
tmp], 0x00)
1294 "daddi %[tmp0], %[tmp0], -0x01 \n\t"
1295 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1296 PTR_ADDU "%[tmp], %[tmp], %[tmpStride] \n\t"
1297 "bnez %[tmp0], 1b \n\t"
1298 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
1299 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
1300 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
1301 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
1302 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
1306 : [tmpStride]
"r"(8),
1307 [srcStride]
"r"((
mips_reg)srcStride),
1314 for (
i=0;
i<4;
i++) {
1315 const int16_t tmpB=
tmp[-8];
1316 const int16_t tmpA=
tmp[-4];
1317 const int16_t tmp0=
tmp[ 0];
1318 const int16_t tmp1=
tmp[ 4];
1319 const int16_t tmp2=
tmp[ 8];
1320 const int16_t tmp3=
tmp[12];
1321 const int16_t tmp4=
tmp[16];
1322 const int16_t tmp5=
tmp[20];
1323 const int16_t tmp6=
tmp[24];
1324 op2_put(
dst[0*dstStride], (tmp0+tmp1)*20 - (tmpA+tmp2)*5 + (tmpB+tmp3));
1325 op2_put(
dst[1*dstStride], (tmp1+tmp2)*20 - (tmp0+tmp3)*5 + (tmpA+tmp4));
1326 op2_put(
dst[2*dstStride], (tmp2+tmp3)*20 - (tmp1+tmp4)*5 + (tmp0+tmp5));
1327 op2_put(
dst[3*dstStride], (tmp3+tmp4)*20 - (tmp2+tmp5)*5 + (tmp1+tmp6));
1334 const uint8_t *
src, ptrdiff_t tmpStride, ptrdiff_t srcStride,
int size)
1336 int w = (
size + 8) >> 2;
1341 src -= 2 * srcStride + 2;
1345 "dli %[tmp0], 0x02 \n\t"
1346 MMI_ULWC1(%[ftmp0], %[
src], 0x00)
1347 "mtc1 %[tmp0], %[ftmp10] \n\t"
1348 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1349 "pxor %[ftmp7], %[ftmp7], %[ftmp7] \n\t"
1350 MMI_ULWC1(%[ftmp1], %[
src], 0x00)
1351 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1352 MMI_ULWC1(%[ftmp2], %[
src], 0x00)
1353 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1354 MMI_ULWC1(%[ftmp3], %[
src], 0x00)
1355 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1356 MMI_ULWC1(%[ftmp4], %[
src], 0x00)
1357 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1358 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
1359 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
1360 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
1361 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp7] \n\t"
1362 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
1363 MMI_ULWC1(%[ftmp5], %[
src], 0x00)
1364 "paddh %[ftmp6], %[ftmp2], %[ftmp3] \n\t"
1365 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1366 "paddh %[ftmp0], %[ftmp0], %[ff_pw_16] \n\t"
1367 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1368 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1369 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
1370 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1371 "paddh %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
1372 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1373 "paddh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1374 MMI_SDC1(%[ftmp6], %[
tmp], 0x00)
1375 MMI_ULWC1(%[ftmp0], %[
src], 0x00)
1376 "paddh %[ftmp6], %[ftmp3], %[ftmp4] \n\t"
1377 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1378 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
1379 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1380 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1381 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
1382 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1383 "paddh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
1384 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1385 "paddh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1386 MMI_SDC1(%[ftmp6], %[
tmp], 0x30)
1387 MMI_ULWC1(%[ftmp1], %[
src], 0x00)
1388 "paddh %[ftmp6], %[ftmp4], %[ftmp5] \n\t"
1389 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1390 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
1391 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1392 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1393 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
1394 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1395 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
1396 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1397 "paddh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1398 MMI_SDC1(%[ftmp6], %[
tmp], 0x60)
1399 MMI_ULWC1(%[ftmp2], %[
src], 0x00)
1400 "paddh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
1401 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1402 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
1403 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1404 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1405 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
1406 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1407 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
1408 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1409 "paddh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1410 MMI_SDC1(%[ftmp6], %[
tmp], 0x90)
1411 MMI_ULWC1(%[ftmp3], %[
src], 0x00)
1412 "paddh %[ftmp6], %[ftmp0], %[ftmp1] \n\t"
1413 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1414 "paddh %[ftmp4], %[ftmp4], %[ff_pw_16] \n\t"
1415 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1416 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1417 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp7] \n\t"
1418 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1419 "paddh %[ftmp4], %[ftmp4], %[ftmp3] \n\t"
1420 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1421 "paddh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1422 MMI_SDC1(%[ftmp6], %[
tmp], 0xc0)
1423 MMI_ULWC1(%[ftmp4], %[
src], 0x00)
1424 "paddh %[ftmp6], %[ftmp1], %[ftmp2] \n\t"
1425 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1426 "paddh %[ftmp5], %[ftmp5], %[ff_pw_16] \n\t"
1427 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1428 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1429 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
1430 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1431 "paddh %[ftmp5], %[ftmp5], %[ftmp4] \n\t"
1432 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1433 "paddh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1434 MMI_SDC1(%[ftmp6], %[
tmp], 0xf0)
1435 MMI_ULWC1(%[ftmp5], %[
src], 0x00)
1436 "paddh %[ftmp6], %[ftmp2], %[ftmp3] \n\t"
1437 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1438 "paddh %[ftmp0], %[ftmp0], %[ff_pw_16] \n\t"
1439 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1440 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1441 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
1442 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1443 "paddh %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
1444 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1445 "paddh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1446 MMI_SDC1(%[ftmp6], %[
tmp], 0x120)
1447 MMI_ULWC1(%[ftmp0], %[
src], 0x00)
1448 "paddh %[ftmp6], %[ftmp3], %[ftmp4] \n\t"
1449 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1450 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
1451 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1452 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1453 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
1454 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1455 "paddh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
1456 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1457 "paddh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1458 MMI_SDC1(%[ftmp6], %[
tmp], 0x150)
1459 "bne %[size], 0x10, 2f \n\t"
1461 MMI_ULWC1(%[ftmp1], %[
src], 0x00)
1462 "paddh %[ftmp6], %[ftmp4], %[ftmp5] \n\t"
1463 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1464 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
1465 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1466 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1467 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
1468 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1469 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
1470 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1471 "paddh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1472 MMI_SDC1(%[ftmp6], %[
tmp], 0x180)
1473 MMI_ULWC1(%[ftmp2], %[
src], 0x00)
1474 "paddh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
1475 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1476 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
1477 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1478 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1479 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
1480 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1481 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
1482 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1483 "paddh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1484 MMI_SDC1(%[ftmp6], %[
tmp], 0x1b0)
1485 MMI_ULWC1(%[ftmp3], %[
src], 0x00)
1486 "paddh %[ftmp6], %[ftmp0], %[ftmp1] \n\t"
1487 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1488 "paddh %[ftmp4], %[ftmp4], %[ff_pw_16] \n\t"
1489 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1490 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1491 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp7] \n\t"
1492 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1493 "paddh %[ftmp4], %[ftmp4], %[ftmp3] \n\t"
1494 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1495 "paddh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1496 MMI_SDC1(%[ftmp6], %[
tmp], 0x1e0)
1497 MMI_ULWC1(%[ftmp4], %[
src], 0x00)
1498 "paddh %[ftmp6], %[ftmp1], %[ftmp2] \n\t"
1499 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1500 "paddh %[ftmp5], %[ftmp5], %[ff_pw_16] \n\t"
1501 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1502 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1503 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
1504 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1505 "paddh %[ftmp5], %[ftmp5], %[ftmp4] \n\t"
1506 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1507 "paddh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1508 MMI_SDC1(%[ftmp6], %[
tmp], 0x210)
1509 MMI_ULWC1(%[ftmp5], %[
src], 0x00)
1510 "paddh %[ftmp6], %[ftmp2], %[ftmp3] \n\t"
1511 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1512 "paddh %[ftmp0], %[ftmp0], %[ff_pw_16] \n\t"
1513 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1514 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1515 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
1516 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1517 "paddh %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
1518 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1519 "paddh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1520 MMI_SDC1(%[ftmp6], %[
tmp], 0x240)
1521 MMI_ULWC1(%[ftmp0], %[
src], 0x00)
1522 "paddh %[ftmp6], %[ftmp3], %[ftmp4] \n\t"
1523 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1524 "paddh %[ftmp1], %[ftmp1], %[ff_pw_16] \n\t"
1525 "psubh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1526 "psubh %[ftmp6], %[ftmp6], %[ftmp5] \n\t"
1527 "punpcklbh %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
1528 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1529 "paddh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
1530 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1531 "paddh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1532 MMI_SDC1(%[ftmp6], %[
tmp], 0x270)
1533 MMI_ULWC1(%[ftmp1], %[
src], 0x00)
1534 "paddh %[ftmp6], %[ftmp4], %[ftmp5] \n\t"
1535 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1536 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
1537 "psubh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1538 "psubh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1539 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
1540 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1541 "paddh %[ftmp2], %[ftmp2], %[ftmp1] \n\t"
1542 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1543 "paddh %[ftmp6], %[ftmp6], %[ftmp2] \n\t"
1544 MMI_SDC1(%[ftmp6], %[
tmp], 0x2a0)
1545 MMI_ULWC1(%[ftmp2], %[
src], 0x00)
1546 "paddh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
1547 "psllh %[ftmp6], %[ftmp6], %[ftmp10] \n\t"
1548 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
1549 "psubh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1550 "psubh %[ftmp6], %[ftmp6], %[ftmp1] \n\t"
1551 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
1552 "pmullh %[ftmp6], %[ftmp6], %[ff_pw_5] \n\t"
1553 "paddh %[ftmp3], %[ftmp3], %[ftmp2] \n\t"
1554 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1555 "paddh %[ftmp6], %[ftmp6], %[ftmp3] \n\t"
1556 MMI_SDC1(%[ftmp6], %[
tmp], 0x2d0)
1558 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
1559 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
1560 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
1561 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
1562 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
1563 [ftmp10]
"=&f"(ftmp[10]),
1568 [srcStride]
"r"((
mips_reg)srcStride),
1574 src += 4 - (
size + 5) * srcStride;
1579 int16_t *
tmp, ptrdiff_t dstStride, ptrdiff_t tmpStride,
int size)
1590 "dli %[tmp0], 0x02 \n\t"
1591 "mtc1 %[tmp0], %[ftmp8] \n\t"
1592 "dli %[tmp0], 0x06 \n\t"
1593 "mtc1 %[tmp0], %[ftmp9] \n\t"
1595 MMI_LDC1(%[ftmp0], %[
tmp], 0x00)
1596 MMI_LDC1(%[ftmp3], %[
tmp], 0x08)
1597 MMI_LDC1(%[ftmp6], %[
tmp], 0x10)
1598 MMI_ULDC1(%[ftmp1], %[
tmp], 0x02)
1599 MMI_ULDC1(%[ftmp4], %[
tmp], 0x0a)
1600 MMI_ULDC1(%[ftmp5], %[
tmp], 0x12)
1601 "paddh %[ftmp0], %[ftmp0], %[ftmp4] \n\t"
1602 "paddh %[ftmp1], %[ftmp1], %[ftmp3] \n\t"
1603 "paddh %[ftmp3], %[ftmp3], %[ftmp5] \n\t"
1604 "paddh %[ftmp4], %[ftmp4], %[ftmp6] \n\t"
1605 MMI_ULDC1(%[ftmp2], %[
tmp], 0x04)
1606 MMI_ULDC1(%[ftmp6], %[
tmp], 0x06)
1607 MMI_ULDC1(%[ftmp5], %[
tmp], 0x0c)
1608 MMI_ULDC1(%[ftmp7], %[
tmp], 0x0e)
1609 "paddh %[ftmp2], %[ftmp2], %[ftmp6] \n\t"
1610 "paddh %[ftmp5], %[ftmp5], %[ftmp7] \n\t"
1611 "psubh %[ftmp0], %[ftmp0], %[ftmp1] \n\t"
1612 "psubh %[ftmp3], %[ftmp3], %[ftmp4] \n\t"
1613 "psrah %[ftmp0], %[ftmp0], %[ftmp8] \n\t"
1614 "psrah %[ftmp3], %[ftmp3], %[ftmp8] \n\t"
1615 "psubh %[ftmp0], %[ftmp0], %[ftmp1] \n\t"
1616 "psubh %[ftmp3], %[ftmp3], %[ftmp4] \n\t"
1617 "paddsh %[ftmp0], %[ftmp0], %[ftmp2] \n\t"
1618 "paddsh %[ftmp3] , %[ftmp3], %[ftmp5] \n\t"
1619 "psrah %[ftmp0], %[ftmp0], %[ftmp8] \n\t"
1620 "psrah %[ftmp3], %[ftmp3], %[ftmp8] \n\t"
1621 "paddh %[ftmp0], %[ftmp0], %[ftmp2] \n\t"
1622 "paddh %[ftmp3], %[ftmp3], %[ftmp5] \n\t"
1623 "psrah %[ftmp0], %[ftmp0], %[ftmp9] \n\t"
1624 "psrah %[ftmp3], %[ftmp3], %[ftmp9] \n\t"
1625 "packushb %[ftmp0], %[ftmp0], %[ftmp3] \n\t"
1626 "addi %[h], %[h], -0x01 \n\t"
1627 MMI_SDC1(%[ftmp0], %[
dst], 0x00)
1629 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1630 "bnez %[h], 1b \n\t"
1631 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
1632 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
1633 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
1634 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
1635 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
1640 : [dstStride]
"r"((
mips_reg)dstStride)
1650 const uint8_t *
src, ptrdiff_t dstStride, ptrdiff_t tmpStride,
1651 ptrdiff_t srcStride,
int size)
1658 const uint8_t *
src, ptrdiff_t dstStride, ptrdiff_t tmpStride,
1659 ptrdiff_t srcStride)
1666 const uint8_t *
src, ptrdiff_t dstStride, ptrdiff_t tmpStride,
1667 ptrdiff_t srcStride)
1674 const uint8_t *
src2, ptrdiff_t dstStride, ptrdiff_t src2Stride)
1683 "dli %[tmp0], 0x02 \n\t"
1684 "mtc1 %[tmp0], %[ftmp7] \n\t"
1685 "dli %[tmp0], 0x05 \n\t"
1686 "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t"
1687 "mtc1 %[tmp0], %[ftmp8] \n\t"
1689 MMI_ULDC1(%[ftmp1], %[
src], 0x00)
1690 MMI_ULDC1(%[ftmp3], %[
src], 0x01)
1691 "punpckhbh %[ftmp2], %[ftmp1], %[ftmp0] \n\t"
1692 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
1693 "punpckhbh %[ftmp4], %[ftmp3], %[ftmp0] \n\t"
1694 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp0] \n\t"
1695 "paddh %[ftmp2], %[ftmp2], %[ftmp4] \n\t"
1696 "paddh %[ftmp1], %[ftmp1], %[ftmp3] \n\t"
1697 "psllh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
1698 "psllh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
1699 MMI_ULDC1(%[ftmp3], %[
src], -0x01)
1700 MMI_ULDC1(%[ftmp5], %[
src], 0x02)
1701 "punpckhbh %[ftmp4], %[ftmp3], %[ftmp0] \n\t"
1702 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp0] \n\t"
1703 "punpckhbh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
1704 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp0] \n\t"
1705 "paddh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
1706 "paddh %[ftmp3], %[ftmp3], %[ftmp5] \n\t"
1707 "psubh %[ftmp2], %[ftmp2], %[ftmp6] \n\t"
1708 "psubh %[ftmp1], %[ftmp1], %[ftmp3] \n\t"
1709 "pmullh %[ftmp2], %[ftmp2], %[ff_pw_5] \n\t"
1710 "pmullh %[ftmp1], %[ftmp1], %[ff_pw_5] \n\t"
1711 MMI_ULWC1(%[ftmp3], %[
src], -0x02)
1712 MMI_ULWC1(%[ftmp6], %[
src], 0x07)
1713 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp0] \n\t"
1714 "punpcklbh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1715 "paddh %[ftmp3], %[ftmp3], %[ftmp4] \n\t"
1716 "paddh %[ftmp5], %[ftmp5], %[ftmp6] \n\t"
1717 "paddh %[ftmp3], %[ftmp3], %[ff_pw_16] \n\t"
1718 "paddh %[ftmp5], %[ftmp5], %[ff_pw_16] \n\t"
1719 "paddh %[ftmp1], %[ftmp1], %[ftmp3] \n\t"
1720 "paddh %[ftmp2], %[ftmp2], %[ftmp5] \n\t"
1721 "psrah %[ftmp1], %[ftmp1], %[ftmp8] \n\t"
1722 "psrah %[ftmp2], %[ftmp2], %[ftmp8] \n\t"
1723 MMI_LDC1(%[ftmp5], %[
src2], 0x00)
1724 "packushb %[ftmp1], %[ftmp1], %[ftmp2] \n\t"
1725 PTR_ADDU "%[src], %[src], %[dstStride] \n\t"
1726 "pavgb %[ftmp1], %[ftmp1], %[ftmp5] \n\t"
1728 MMI_SDC1(%[ftmp1], %[
dst], 0x00)
1729 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1730 PTR_ADDU "%[src2], %[src2], %[src2Stride] \n\t"
1731 "bgtz %[h], 1b \n\t"
1732 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
1733 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
1734 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
1735 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
1736 [ftmp8]
"=&f"(ftmp[8]),
1737 [tmp0]
"=&r"(
tmp[0]),
1742 : [src2Stride]
"r"((
mips_reg)src2Stride),
1743 [dstStride]
"r"((
mips_reg)dstStride),
1750 const uint8_t *src8, ptrdiff_t dstStride, ptrdiff_t src8Stride,
int h)
1759 "dli %[tmp0], 0x05 \n\t"
1760 MMI_ULDC1(%[ftmp0], %[src16], 0x00)
1761 "mtc1 %[tmp0], %[ftmp6] \n\t"
1762 MMI_ULDC1(%[ftmp1], %[src16], 0x08)
1763 MMI_ULDC1(%[ftmp2], %[src16], 0x30)
1764 MMI_ULDC1(%[ftmp3], %[src16], 0x38)
1765 "psrah %[ftmp0], %[ftmp0], %[ftmp6] \n\t"
1766 "psrah %[ftmp1], %[ftmp1], %[ftmp6] \n\t"
1767 "psrah %[ftmp2], %[ftmp2], %[ftmp6] \n\t"
1768 "psrah %[ftmp3], %[ftmp3], %[ftmp6] \n\t"
1769 "packushb %[ftmp0], %[ftmp0], %[ftmp1] \n\t"
1770 "packushb %[ftmp2], %[ftmp2], %[ftmp3] \n\t"
1771 MMI_LDC1(%[ftmp5], %[src8], 0x00)
1772 MMI_LDXC1(%[ftmp4], %[src8], %[src8Stride], 0x00)
1773 "pavgb %[ftmp0], %[ftmp0], %[ftmp5] \n\t"
1774 "pavgb %[ftmp2], %[ftmp2], %[ftmp4] \n\t"
1775 MMI_SDC1(%[ftmp0], %[
dst], 0x00)
1776 MMI_SDXC1(%[ftmp2], %[
dst], %[dstStride], 0x00)
1777 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
1778 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
1779 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
1780 [ftmp6]
"=&f"(ftmp[6]),
1784 : [src8]
"r"(src8), [src16]
"r"(src16),
1786 [src8Stride]
"r"((
mips_reg)src8Stride),
1787 [dstStride]
"r"((
mips_reg)dstStride)
1791 src8 += 2 * src8Stride;
1793 dst += 2 * dstStride;
1798 const uint8_t *
src2, ptrdiff_t dstStride, ptrdiff_t src2Stride)
1804 src += 8 * dstStride;
1805 dst += 8 * dstStride;
1806 src2 += 8 * src2Stride;
1814 const uint8_t *src8, ptrdiff_t dstStride, ptrdiff_t src8Stride,
int h)
1822 int dstStride,
int srcStride)
1826 int16_t *
tmp = _tmp;
1834 "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t"
1835 "dli %[tmp0], 0x09 \n\t"
1837 MMI_ULWC1(%[ftmp1], %[
src], -0x02)
1838 MMI_ULWC1(%[ftmp2], %[
src], -0x01)
1839 MMI_ULWC1(%[ftmp3], %[
src], 0x00)
1840 MMI_ULWC1(%[ftmp4], %[
src], 0x01)
1841 MMI_ULWC1(%[ftmp5], %[
src], 0x02)
1842 MMI_ULWC1(%[ftmp6], %[
src], 0x03)
1843 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
1844 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp0] \n\t"
1845 "punpcklbh %[ftmp3], %[ftmp3], %[ftmp0] \n\t"
1846 "punpcklbh %[ftmp4], %[ftmp4], %[ftmp0] \n\t"
1847 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp0] \n\t"
1848 "punpcklbh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
1849 "paddsh %[ftmp7], %[ftmp3], %[ftmp4] \n\t"
1850 "paddsh %[ftmp8], %[ftmp2], %[ftmp5] \n\t"
1851 "paddsh %[ftmp9], %[ftmp1], %[ftmp6] \n\t"
1852 "pmullh %[ftmp7], %[ftmp7], %[ff_pw_20] \n\t"
1853 "pmullh %[ftmp8], %[ftmp8], %[ff_pw_5] \n\t"
1854 "psubsh %[ftmp7], %[ftmp7], %[ftmp8] \n\t"
1855 "paddsh %[ftmp9], %[ftmp7], %[ftmp9] \n\t"
1856 MMI_SDC1(%[ftmp9], %[
tmp], 0x00)
1857 "daddi %[tmp0], %[tmp0], -0x01 \n\t"
1858 PTR_ADDU "%[src], %[src], %[srcStride] \n\t"
1859 PTR_ADDU "%[tmp], %[tmp], %[tmpStride] \n\t"
1860 "bnez %[tmp0], 1b \n\t"
1861 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
1862 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
1863 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
1864 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
1865 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
1869 : [tmpStride]
"r"(8),
1870 [srcStride]
"r"((
mips_reg)srcStride),
1877 for (
i=0;
i<4;
i++) {
1878 const int16_t tmpB=
tmp[-8];
1879 const int16_t tmpA=
tmp[-4];
1880 const int16_t tmp0=
tmp[ 0];
1881 const int16_t tmp1=
tmp[ 4];
1882 const int16_t tmp2=
tmp[ 8];
1883 const int16_t tmp3=
tmp[12];
1884 const int16_t tmp4=
tmp[16];
1885 const int16_t tmp5=
tmp[20];
1886 const int16_t tmp6=
tmp[24];
1887 op2_avg(
dst[0*dstStride], (tmp0+tmp1)*20 - (tmpA+tmp2)*5 + (tmpB+tmp3));
1888 op2_avg(
dst[1*dstStride], (tmp1+tmp2)*20 - (tmp0+tmp3)*5 + (tmpA+tmp4));
1889 op2_avg(
dst[2*dstStride], (tmp2+tmp3)*20 - (tmp1+tmp4)*5 + (tmp0+tmp5));
1890 op2_avg(
dst[3*dstStride], (tmp3+tmp4)*20 - (tmp2+tmp5)*5 + (tmp1+tmp6));
1897 int16_t *
tmp, ptrdiff_t dstStride, ptrdiff_t tmpStride,
int size)
1907 "dli %[tmp0], 0x02 \n\t"
1908 "mtc1 %[tmp0], %[ftmp9] \n\t"
1909 "dli %[tmp0], 0x06 \n\t"
1910 "mtc1 %[tmp0], %[ftmp10] \n\t"
1912 MMI_LDC1(%[ftmp0], %[
tmp], 0x00)
1913 MMI_LDC1(%[ftmp3], %[
tmp], 0x08)
1914 MMI_ULDC1(%[ftmp1], %[
tmp], 0x02)
1915 MMI_ULDC1(%[ftmp4], %[
tmp], 0x0a)
1916 MMI_LDC1(%[ftmp7], %[
tmp], 0x10)
1917 MMI_ULDC1(%[ftmp8], %[
tmp], 0x12)
1918 "paddh %[ftmp0], %[ftmp0], %[ftmp4] \n\t"
1919 "paddh %[ftmp1], %[ftmp1], %[ftmp3] \n\t"
1920 "paddh %[ftmp3], %[ftmp3], %[ftmp8] \n\t"
1921 "paddh %[ftmp4], %[ftmp4], %[ftmp7] \n\t"
1922 MMI_ULDC1(%[ftmp2], %[
tmp], 0x04)
1923 MMI_ULDC1(%[ftmp5], %[
tmp], 0x0c)
1924 MMI_ULDC1(%[ftmp7], %[
tmp], 0x06)
1925 MMI_ULDC1(%[ftmp8], %[
tmp], 0x0e)
1926 "paddh %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
1927 "paddh %[ftmp5], %[ftmp5], %[ftmp8] \n\t"
1928 "psubh %[ftmp0], %[ftmp0], %[ftmp1] \n\t"
1929 "psubh %[ftmp3], %[ftmp3], %[ftmp4] \n\t"
1930 "psrah %[ftmp0], %[ftmp0], %[ftmp9] \n\t"
1931 "psrah %[ftmp3], %[ftmp3], %[ftmp9] \n\t"
1932 "psubh %[ftmp0], %[ftmp0], %[ftmp1] \n\t"
1933 "psubh %[ftmp3], %[ftmp3], %[ftmp4] \n\t"
1934 "paddsh %[ftmp0], %[ftmp0], %[ftmp2] \n\t"
1935 "paddsh %[ftmp3], %[ftmp3], %[ftmp5] \n\t"
1936 "psrah %[ftmp0], %[ftmp0], %[ftmp9] \n\t"
1937 "psrah %[ftmp3], %[ftmp3], %[ftmp9] \n\t"
1938 "paddh %[ftmp0], %[ftmp0], %[ftmp2] \n\t"
1939 "paddh %[ftmp3], %[ftmp3], %[ftmp5] \n\t"
1940 "psrah %[ftmp0], %[ftmp0], %[ftmp10] \n\t"
1941 "psrah %[ftmp3], %[ftmp3], %[ftmp10] \n\t"
1942 "packushb %[ftmp0], %[ftmp0], %[ftmp3] \n\t"
1943 MMI_LDC1(%[ftmp6], %[
dst], 0x00)
1944 "pavgb %[ftmp0], %[ftmp0], %[ftmp6] \n\t"
1945 MMI_SDC1(%[ftmp0], %[
dst], 0x00)
1946 "addi %[h], %[h], -0x01 \n\t"
1947 PTR_ADDI "%[tmp], %[tmp], 0x30 \n\t"
1948 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
1949 "bnez %[h], 1b \n\t"
1950 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
1951 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
1952 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
1953 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
1954 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
1955 [ftmp10]
"=&f"(ftmp[10]),
1960 : [dstStride]
"r"((
mips_reg)dstStride)
1970 const uint8_t *
src, ptrdiff_t dstStride, ptrdiff_t tmpStride,
1971 ptrdiff_t srcStride,
int size)
1978 const uint8_t *
src, ptrdiff_t dstStride, ptrdiff_t tmpStride,
1979 ptrdiff_t srcStride)
1986 const uint8_t *
src, ptrdiff_t dstStride, ptrdiff_t tmpStride,
1987 ptrdiff_t srcStride)
1994 const uint8_t *
src2, ptrdiff_t dstStride, ptrdiff_t src2Stride)
2002 "dli %[tmp1], 0x02 \n\t"
2003 "ori %[tmp0], $0, 0x8 \n\t"
2004 "mtc1 %[tmp1], %[ftmp7] \n\t"
2005 "dli %[tmp1], 0x05 \n\t"
2006 "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t"
2007 "mtc1 %[tmp1], %[ftmp8] \n\t"
2009 MMI_ULDC1(%[ftmp1], %[
src], 0x00)
2010 MMI_ULDC1(%[ftmp2], %[
src], 0x01)
2011 "punpckhbh %[ftmp3], %[ftmp1], %[ftmp0] \n\t"
2012 "punpcklbh %[ftmp1], %[ftmp1], %[ftmp0] \n\t"
2013 "punpckhbh %[ftmp4], %[ftmp2], %[ftmp0] \n\t"
2014 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp0] \n\t"
2015 "paddh %[ftmp1], %[ftmp1], %[ftmp2] \n\t"
2016 "paddh %[ftmp3], %[ftmp3], %[ftmp4] \n\t"
2017 "psllh %[ftmp1], %[ftmp1], %[ftmp7] \n\t"
2018 "psllh %[ftmp3], %[ftmp3], %[ftmp7] \n\t"
2019 MMI_ULDC1(%[ftmp2], %[
src], -0x01)
2020 MMI_ULDC1(%[ftmp5], %[
src], 0x02)
2021 "punpckhbh %[ftmp4], %[ftmp2], %[ftmp0] \n\t"
2022 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp0] \n\t"
2023 "punpckhbh %[ftmp6], %[ftmp5], %[ftmp0] \n\t"
2024 "punpcklbh %[ftmp5], %[ftmp5], %[ftmp0] \n\t"
2025 "paddh %[ftmp2], %[ftmp2], %[ftmp5] \n\t"
2026 "paddh %[ftmp6], %[ftmp6], %[ftmp4] \n\t"
2027 "psubh %[ftmp1], %[ftmp1], %[ftmp2] \n\t"
2028 "psubh %[ftmp3], %[ftmp3], %[ftmp6] \n\t"
2029 "pmullh %[ftmp1], %[ftmp1], %[ff_pw_5] \n\t"
2030 "pmullh %[ftmp3], %[ftmp3], %[ff_pw_5] \n\t"
2031 MMI_ULWC1(%[ftmp2], %[
src], -0x02)
2032 MMI_ULWC1(%[ftmp6], %[
src], 0x07)
2033 "punpcklbh %[ftmp2], %[ftmp2], %[ftmp0] \n\t"
2034 "punpcklbh %[ftmp6], %[ftmp6], %[ftmp0] \n\t"
2035 "paddh %[ftmp2], %[ftmp2], %[ftmp4] \n\t"
2036 "paddh %[ftmp5], %[ftmp5], %[ftmp6] \n\t"
2037 "paddh %[ftmp2], %[ftmp2], %[ff_pw_16] \n\t"
2038 "paddh %[ftmp5], %[ftmp5], %[ff_pw_16] \n\t"
2039 "paddh %[ftmp1], %[ftmp1], %[ftmp2] \n\t"
2040 "paddh %[ftmp3], %[ftmp3], %[ftmp5] \n\t"
2041 "psrah %[ftmp1], %[ftmp1], %[ftmp8] \n\t"
2042 "psrah %[ftmp3], %[ftmp3], %[ftmp8] \n\t"
2043 MMI_LDC1(%[ftmp5], %[
src2], 0x00)
2044 "packushb %[ftmp1], %[ftmp1], %[ftmp3] \n\t"
2045 MMI_LDC1(%[ftmp9], %[
dst], 0x00)
2046 "pavgb %[ftmp1], %[ftmp1], %[ftmp5] \n\t"
2047 "pavgb %[ftmp1], %[ftmp1], %[ftmp9] \n\t"
2048 PTR_ADDU "%[src], %[src], %[dstStride] \n\t"
2049 MMI_SDC1(%[ftmp1], %[
dst], 0x00)
2050 "daddi %[tmp0], %[tmp0], -0x01 \n\t"
2051 PTR_ADDU "%[dst], %[dst], %[dstStride] \n\t"
2052 PTR_ADDU "%[src2], %[src2], %[src2Stride] \n\t"
2053 "bgtz %[tmp0], 1b \n\t"
2054 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
2055 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
2056 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
2057 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
2058 [ftmp8]
"=&f"(ftmp[8]), [ftmp9]
"=&f"(ftmp[9]),
2059 [tmp0]
"=&r"(
tmp[0]), [tmp1]
"=&r"(
tmp[1]),
2064 : [dstStride]
"r"((
mips_reg)dstStride),
2065 [src2Stride]
"r"((
mips_reg)src2Stride),
2072 const uint8_t *
src2, ptrdiff_t dstStride, ptrdiff_t src2Stride)
2078 src += 8 * dstStride;
2079 dst += 8 * dstStride;
2080 src2 += 8 * src2Stride;
2088 const uint8_t *src8, ptrdiff_t dstStride, ptrdiff_t src8Stride,
int b)
2097 "dli %[tmp0], 0x05 \n\t"
2098 MMI_ULDC1(%[ftmp0], %[src16], 0x00)
2099 "mtc1 %[tmp0], %[ftmp6] \n\t"
2100 MMI_ULDC1(%[ftmp1], %[src16], 0x08)
2101 MMI_ULDC1(%[ftmp2], %[src16], 0x30)
2102 MMI_ULDC1(%[ftmp3], %[src16], 0x38)
2103 "psrah %[ftmp0], %[ftmp0], %[ftmp6] \n\t"
2104 "psrah %[ftmp1], %[ftmp1], %[ftmp6] \n\t"
2105 "psrah %[ftmp2], %[ftmp2], %[ftmp6] \n\t"
2106 "psrah %[ftmp3], %[ftmp3], %[ftmp6] \n\t"
2107 "packushb %[ftmp0], %[ftmp0], %[ftmp1] \n\t"
2108 MMI_LDC1(%[ftmp4], %[src8], 0x00)
2109 MMI_LDXC1(%[ftmp5], %[src8], %[src8Stride], 0x00)
2110 "packushb %[ftmp2], %[ftmp2], %[ftmp3] \n\t"
2111 "pavgb %[ftmp0], %[ftmp0], %[ftmp4] \n\t"
2112 "pavgb %[ftmp2], %[ftmp2], %[ftmp5] \n\t"
2113 MMI_LDC1(%[ftmp7], %[
dst], 0x00)
2114 "pavgb %[ftmp0], %[ftmp0], %[ftmp7] \n\t"
2115 MMI_SDC1(%[ftmp0], %[
dst], 0x00)
2116 MMI_LDXC1(%[ftmp7], %[
dst], %[dstStride], 0x00)
2117 "pavgb %[ftmp2], %[ftmp2], %[ftmp7] \n\t"
2118 MMI_SDXC1(%[ftmp2], %[
dst], %[dstStride], 0x00)
2119 : [ftmp0]
"=&f"(ftmp[0]), [ftmp1]
"=&f"(ftmp[1]),
2120 [ftmp2]
"=&f"(ftmp[2]), [ftmp3]
"=&f"(ftmp[3]),
2121 [ftmp4]
"=&f"(ftmp[4]), [ftmp5]
"=&f"(ftmp[5]),
2122 [ftmp6]
"=&f"(ftmp[6]), [ftmp7]
"=&f"(ftmp[7]),
2126 : [src8]
"r"(src8), [src16]
"r"(src16),
2128 [src8Stride]
"r"((
mips_reg)src8Stride),
2129 [dstStride]
"r"((
mips_reg)dstStride)
2133 src8 += 2 * src8Stride;
2135 dst += 2 * dstStride;
2140 const uint8_t *src8, ptrdiff_t dstStride, ptrdiff_t src8Stride,
int b)
2180 uint8_t *
const full_mid= full + 8;
2191 uint8_t *
const full_mid= full + 8;
2200 uint8_t *
const full_mid= full + 8;
2211 uint8_t *
const full_mid= full + 8;
2224 uint8_t *
const full_mid= full + 8;
2237 uint8_t *
const full_mid= full + 8;
2250 uint8_t *
const full_mid= full + 8;
2289 uint8_t *
const full_mid= full + 8;
2302 uint8_t *
const full_mid= full + 8;
2344 uint8_t *
const full_mid= full + 8;
2355 uint8_t *
const full_mid= full + 8;
2364 uint8_t *
const full_mid= full + 8;
2375 uint8_t *
const full_mid= full + 8;
2388 uint8_t *
const full_mid= full + 8;
2401 uint8_t *
const full_mid= full + 8;
2414 uint8_t *
const full_mid= full + 8;
2453 uint8_t *
const full_mid= full + 8;
2466 uint8_t *
const full_mid= full + 8;
2508 uint8_t *
const full_mid= full + 16;
2519 uint8_t *
const full_mid= full + 16;
2528 uint8_t *
const full_mid= full + 16;
2539 uint8_t *
const full_mid= full + 16;
2552 uint8_t *
const full_mid= full + 16;
2565 uint8_t *
const full_mid= full + 16;
2578 uint8_t *
const full_mid= full + 16;
2599 uint8_t *
const halfHV =
temp;
2600 int16_t *
const halfV = (int16_t *) (
temp + 64);
2610 uint8_t *
const halfHV =
temp;
2611 int16_t *
const halfV = (int16_t *) (
temp + 64);
2621 uint8_t *
const halfHV =
temp;
2622 int16_t *
const halfV = (int16_t *) (
temp + 64);
2632 uint8_t *
const halfHV =
temp;
2633 int16_t *
const halfV = (int16_t *) (
temp + 64);
2672 uint8_t *
const full_mid= full + 16;
2683 uint8_t *
const full_mid= full + 16;
2692 uint8_t *
const full_mid= full + 16;
2703 uint8_t *
const full_mid= full + 16;
2716 uint8_t *
const full_mid= full + 16;
2729 uint8_t *
const full_mid= full + 16;
2742 uint8_t *
const full_mid= full + 16;
2763 uint8_t *
const halfHV =
temp;
2764 int16_t *
const halfV = (int16_t *) (
temp + 64);
2774 uint8_t *
const halfHV =
temp;
2775 int16_t *
const halfV = (int16_t *) (
temp + 64);
2785 uint8_t *
const halfHV =
temp;
2786 int16_t *
const halfV = (int16_t *) (
temp + 64);
2796 uint8_t *
const halfHV =
temp;
2797 int16_t *
const halfV = (int16_t *) (
temp + 64);
2836 uint8_t *
const full_mid= full + 32;
2847 uint8_t *
const full_mid= full + 32;
2856 uint8_t *
const full_mid= full + 32;
2867 uint8_t *
const full_mid= full + 32;
2880 uint8_t *
const full_mid= full + 32;
2893 uint8_t *
const full_mid= full + 32;
2906 uint8_t *
const full_mid= full + 32;
2927 uint8_t *
const halfHV =
temp;
2928 int16_t *
const halfV = (int16_t *) (
temp + 256);
2938 uint8_t *
const halfHV =
temp;
2939 int16_t *
const halfV = (int16_t *) (
temp + 256);
2949 uint8_t *
const halfHV =
temp;
2950 int16_t *
const halfV = (int16_t *) (
temp + 256);
2960 uint8_t *
const halfHV =
temp;
2961 int16_t *
const halfV = (int16_t *) (
temp + 256);
3000 uint8_t *
const full_mid= full + 32;
3011 uint8_t *
const full_mid= full + 32;
3020 uint8_t *
const full_mid= full + 32;
3031 uint8_t *
const full_mid= full + 32;
3044 uint8_t *
const full_mid= full + 32;
3057 uint8_t *
const full_mid= full + 32;
3070 uint8_t *
const full_mid= full + 32;
3091 uint8_t *
const halfHV =
temp;
3092 int16_t *
const halfV = (int16_t *) (
temp + 256);
3102 uint8_t *
const halfHV =
temp;
3103 int16_t *
const halfV = (int16_t *) (
temp + 256);
3113 uint8_t *
const halfHV =
temp;
3114 int16_t *
const halfV = (int16_t *) (
temp + 256);
3124 uint8_t *
const halfHV =
temp;
3125 int16_t *
const halfV = (int16_t *) (
temp + 256);
void ff_put_h264_qpel8_mc13_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc03_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel4_mc23_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel8_mc22_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel4_mc02_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_pixels4_l2_8_mmi(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, int src_stride1, int src_stride2, int h)
static void put_h264_qpel4_v_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
static void avg_h264_qpel16_hv_lowpass_mmi(uint8_t *dst, int16_t *tmp, const uint8_t *src, ptrdiff_t dstStride, ptrdiff_t tmpStride, ptrdiff_t srcStride)
void ff_avg_h264_qpel8_mc11_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel8_mc31_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel8_mc10_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void put_h264_qpel8or16_hv1_lowpass_mmi(int16_t *tmp, const uint8_t *src, ptrdiff_t tmpStride, ptrdiff_t srcStride, int size)
void ff_avg_h264_qpel8_mc30_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel16_mc11_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel4_mc33_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void put_h264_qpel8_h_lowpass_l2_mmi(uint8_t *dst, const uint8_t *src, const uint8_t *src2, ptrdiff_t dstStride, ptrdiff_t src2Stride)
void ff_put_h264_qpel4_mc20_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc23_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
#define DECLARE_VAR_LOW32
static void avg_h264_qpel8_h_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
void ff_put_h264_qpel8_mc00_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void avg_h264_qpel8or16_hv_lowpass_mmi(uint8_t *dst, int16_t *tmp, const uint8_t *src, ptrdiff_t dstStride, ptrdiff_t tmpStride, ptrdiff_t srcStride, int size)
void ff_put_h264_qpel16_mc12_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static uint8_t half(int a, int b)
void ff_avg_h264_qpel4_mc11_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel4_mc13_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel8_mc02_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel16_mc31_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_pixels8_8_mmi(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int32_t h)
void ff_avg_h264_qpel4_mc10_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel4_mc32_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void avg_h264_qpel16_h_lowpass_l2_mmi(uint8_t *dst, const uint8_t *src, const uint8_t *src2, ptrdiff_t dstStride, ptrdiff_t src2Stride)
static void put_h264_qpel8_hv_lowpass_mmi(uint8_t *dst, int16_t *tmp, const uint8_t *src, ptrdiff_t dstStride, ptrdiff_t tmpStride, ptrdiff_t srcStride)
void ff_put_h264_qpel8_mc33_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_pixels4_l2_8_mmi(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, int src_stride1, int src_stride2, int h)
void ff_put_h264_qpel4_mc02_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel4_mc12_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel16_mc32_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc31_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel16_mc21_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel8_mc33_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void put_h264_qpel4_h_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
static void avg_h264_qpel16_h_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
void ff_avg_h264_qpel4_mc00_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc01_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel4_mc32_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel8_mc31_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static int aligned(int val)
void ff_put_pixels8_8_mmi(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int32_t h)
void ff_avg_h264_qpel16_mc10_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void avg_h264_qpel8_h_lowpass_l2_mmi(uint8_t *dst, const uint8_t *src, const uint8_t *src2, ptrdiff_t dstStride, ptrdiff_t src2Stride)
void ff_avg_h264_qpel4_mc12_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel8_mc32_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel16_mc23_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
const union av_intfloat64 ff_pw_20
static void put_h264_qpel8or16_hv2_lowpass_mmi(uint8_t *dst, int16_t *tmp, ptrdiff_t dstStride, ptrdiff_t tmpStride, int size)
void ff_avg_h264_qpel4_mc23_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void put_h264_qpel8or16_hv_lowpass_mmi(uint8_t *dst, int16_t *tmp, const uint8_t *src, ptrdiff_t dstStride, ptrdiff_t tmpStride, ptrdiff_t srcStride, int size)
void ff_put_h264_qpel4_mc30_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel4_mc01_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel16_mc12_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel4_mc11_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void avg_h264_qpel8_v_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
static void put_h264_qpel4_hv_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
void ff_avg_h264_qpel8_mc13_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel4_mc30_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void put_h264_qpel16_hv_lowpass_mmi(uint8_t *dst, int16_t *tmp, const uint8_t *src, ptrdiff_t dstStride, ptrdiff_t tmpStride, ptrdiff_t srcStride)
static void avg_h264_qpel8or16_hv2_lowpass_mmi(uint8_t *dst, int16_t *tmp, ptrdiff_t dstStride, ptrdiff_t tmpStride, int size)
void ff_avg_h264_qpel16_mc03_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void copy_block16_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride, int h)
static void put_h264_qpel16_h_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
void ff_put_h264_qpel8_mc12_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel4_mc31_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void put_h264_qpel16_v_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
void ff_avg_h264_qpel8_mc01_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel4_mc01_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc00_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel16_mc20_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel8_mc12_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel8_mc11_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_pixels16_l2_8_mmi(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, int src_stride1, int src_stride2, int h)
uint8_t ptrdiff_t const uint8_t ptrdiff_t int intptr_t intptr_t int int16_t * dst
void ff_put_h264_qpel8_mc32_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void avg_pixels8_l2_shift5_mmi(uint8_t *dst, int16_t *src16, const uint8_t *src8, ptrdiff_t dstStride, ptrdiff_t src8Stride, int b)
static void avg_h264_qpel16_v_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
void ff_avg_h264_qpel16_mc13_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void avg_h264_qpel4_h_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
void ff_put_h264_qpel4_mc10_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel8_mc03_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
#define DECLARE_VAR_ALL64
void ff_put_h264_qpel4_mc03_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc11_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void put_pixels8_l2_shift5_mmi(uint8_t *dst, int16_t *src16, const uint8_t *src8, ptrdiff_t dstStride, ptrdiff_t src8Stride, int h)
static void put_h264_qpel8_v_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
void ff_avg_h264_qpel16_mc22_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void avg_h264_qpel8_hv_lowpass_mmi(uint8_t *dst, int16_t *tmp, const uint8_t *src, ptrdiff_t dstStride, ptrdiff_t tmpStride, ptrdiff_t srcStride)
void ff_avg_h264_qpel16_mc33_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel8_mc02_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel8_mc10_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel4_mc20_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel8_mc01_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
#define i(width, name, range_min, range_max)
static void avg_pixels16_l2_shift5_mmi(uint8_t *dst, int16_t *src16, const uint8_t *src8, ptrdiff_t dstStride, ptrdiff_t src8Stride, int b)
void ff_avg_h264_qpel16_mc00_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc33_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void put_pixels16_l2_shift5_mmi(uint8_t *dst, int16_t *src16, const uint8_t *src8, ptrdiff_t dstStride, ptrdiff_t src8Stride, int h)
static void avg_h264_qpel4_v_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
void ff_avg_h264_qpel4_mc22_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void put_h264_qpel8_h_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
static void copy_block8_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride, int h)
void ff_put_h264_qpel8_mc22_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_pixels8_l2_8_mmi(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, int src_stride1, int src_stride2, int h)
void ff_avg_h264_qpel16_mc02_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void copy_block4_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride, int h)
static void avg_h264_qpel4_hv_lowpass_mmi(uint8_t *dst, const uint8_t *src, int dstStride, int srcStride)
void ff_avg_pixels16_8_mmi(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int32_t h)
__asm__(".macro parse_r var r\n\t" "\\var = -1\n\t" _IFC_REG(0) _IFC_REG(1) _IFC_REG(2) _IFC_REG(3) _IFC_REG(4) _IFC_REG(5) _IFC_REG(6) _IFC_REG(7) _IFC_REG(8) _IFC_REG(9) _IFC_REG(10) _IFC_REG(11) _IFC_REG(12) _IFC_REG(13) _IFC_REG(14) _IFC_REG(15) _IFC_REG(16) _IFC_REG(17) _IFC_REG(18) _IFC_REG(19) _IFC_REG(20) _IFC_REG(21) _IFC_REG(22) _IFC_REG(23) _IFC_REG(24) _IFC_REG(25) _IFC_REG(26) _IFC_REG(27) _IFC_REG(28) _IFC_REG(29) _IFC_REG(30) _IFC_REG(31) ".iflt \\var\n\t" ".error \"Unable to parse register name \\r\"\n\t" ".endif\n\t" ".endm")
void ff_put_h264_qpel4_mc00_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
static void put_h264_qpel16_h_lowpass_l2_mmi(uint8_t *dst, const uint8_t *src, const uint8_t *src2, ptrdiff_t dstStride, ptrdiff_t src2Stride)
void ff_put_h264_qpel4_mc22_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel16_mc01_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel8_mc21_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
#define RESTRICT_ASM_LOW32
#define DECLARE_VAR_ADDRT
void ff_put_h264_qpel8_mc30_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_pixels4_8_mmi(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int32_t h)
void ff_avg_h264_qpel8_mc21_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc13_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel4_mc21_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel4_mc03_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel16_mc30_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel8_mc03_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel8_mc20_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel8_mc23_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel8_mc20_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc10_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc30_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel4_mc33_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc21_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel4_mc21_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_pixels16_8_mmi(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int32_t h)
void ff_put_h264_qpel16_mc22_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc20_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_avg_h264_qpel4_mc13_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel4_mc31_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
const union av_intfloat64 ff_pw_5
#define RESTRICT_ASM_ADDRT
#define RESTRICT_ASM_ALL64
void ff_avg_h264_qpel8_mc23_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc02_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_h264_qpel16_mc32_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
const union av_intfloat64 ff_pw_16
void ff_put_pixels16_l2_8_mmi(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, int src_stride1, int src_stride2, int h)
void ff_avg_pixels4_8_mmi(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int32_t h)
void ff_avg_h264_qpel8_mc00_mmi(uint8_t *dst, const uint8_t *src, ptrdiff_t stride)
void ff_put_pixels8_l2_8_mmi(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, int src_stride1, int src_stride2, int h)