123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114 |
- /*
- * Copyright (c) 2017 The WebM project authors. All Rights Reserved.
- *
- * Use of this source code is governed by a BSD-style license
- * that can be found in the LICENSE file in the root of the source
- * tree. An additional intellectual property rights grant can be found
- * in the file PATENTS. All contributing project authors may
- * be found in the AUTHORS file in the root of the source tree.
- */
- #include "./vp8_rtcd.h"
- #include "vpx_ports/asmdefs_mmi.h"
- #define COPY_MEM_16X2 \
- "gsldlc1 %[ftmp0], 0x07(%[src]) \n\t" \
- "gsldrc1 %[ftmp0], 0x00(%[src]) \n\t" \
- "ldl %[tmp0], 0x0f(%[src]) \n\t" \
- "ldr %[tmp0], 0x08(%[src]) \n\t" \
- MMI_ADDU(%[src], %[src], %[src_stride]) \
- "gssdlc1 %[ftmp0], 0x07(%[dst]) \n\t" \
- "gssdrc1 %[ftmp0], 0x00(%[dst]) \n\t" \
- "sdl %[tmp0], 0x0f(%[dst]) \n\t" \
- "sdr %[tmp0], 0x08(%[dst]) \n\t" \
- MMI_ADDU(%[dst], %[dst], %[dst_stride]) \
- "gsldlc1 %[ftmp1], 0x07(%[src]) \n\t" \
- "gsldrc1 %[ftmp1], 0x00(%[src]) \n\t" \
- "ldl %[tmp1], 0x0f(%[src]) \n\t" \
- "ldr %[tmp1], 0x08(%[src]) \n\t" \
- MMI_ADDU(%[src], %[src], %[src_stride]) \
- "gssdlc1 %[ftmp1], 0x07(%[dst]) \n\t" \
- "gssdrc1 %[ftmp1], 0x00(%[dst]) \n\t" \
- "sdl %[tmp1], 0x0f(%[dst]) \n\t" \
- "sdr %[tmp1], 0x08(%[dst]) \n\t" \
- MMI_ADDU(%[dst], %[dst], %[dst_stride])
- #define COPY_MEM_8X2 \
- "gsldlc1 %[ftmp0], 0x07(%[src]) \n\t" \
- "gsldrc1 %[ftmp0], 0x00(%[src]) \n\t" \
- MMI_ADDU(%[src], %[src], %[src_stride]) \
- "ldl %[tmp0], 0x07(%[src]) \n\t" \
- "ldr %[tmp0], 0x00(%[src]) \n\t" \
- MMI_ADDU(%[src], %[src], %[src_stride]) \
- \
- "gssdlc1 %[ftmp0], 0x07(%[dst]) \n\t" \
- "gssdrc1 %[ftmp0], 0x00(%[dst]) \n\t" \
- MMI_ADDU(%[dst], %[dst], %[dst_stride]) \
- "sdl %[tmp0], 0x07(%[dst]) \n\t" \
- "sdr %[tmp0], 0x00(%[dst]) \n\t" \
- MMI_ADDU(%[dst], %[dst], %[dst_stride])
- void vp8_copy_mem16x16_mmi(unsigned char *src, int src_stride,
- unsigned char *dst, int dst_stride) {
- double ftmp[2];
- uint64_t tmp[2];
- uint8_t loop_count = 4;
- /* clang-format off */
- __asm__ volatile (
- "1: \n\t"
- COPY_MEM_16X2
- COPY_MEM_16X2
- MMI_ADDIU(%[loop_count], %[loop_count], -0x01)
- "bnez %[loop_count], 1b \n\t"
- : [ftmp0]"=&f"(ftmp[0]), [ftmp1]"=&f"(ftmp[1]),
- [tmp0]"=&r"(tmp[0]), [tmp1]"=&r"(tmp[1]),
- [loop_count]"+&r"(loop_count),
- [dst]"+&r"(dst), [src]"+&r"(src)
- : [src_stride]"r"((mips_reg)src_stride),
- [dst_stride]"r"((mips_reg)dst_stride)
- : "memory"
- );
- /* clang-format on */
- }
- void vp8_copy_mem8x8_mmi(unsigned char *src, int src_stride, unsigned char *dst,
- int dst_stride) {
- double ftmp[2];
- uint64_t tmp[1];
- uint8_t loop_count = 4;
- /* clang-format off */
- __asm__ volatile (
- "1: \n\t"
- COPY_MEM_8X2
- MMI_ADDIU(%[loop_count], %[loop_count], -0x01)
- "bnez %[loop_count], 1b \n\t"
- : [ftmp0]"=&f"(ftmp[0]), [ftmp1]"=&f"(ftmp[1]),
- [tmp0]"=&r"(tmp[0]), [loop_count]"+&r"(loop_count),
- [dst]"+&r"(dst), [src]"+&r"(src)
- : [src_stride]"r"((mips_reg)src_stride),
- [dst_stride]"r"((mips_reg)dst_stride)
- : "memory"
- );
- /* clang-format on */
- }
- void vp8_copy_mem8x4_mmi(unsigned char *src, int src_stride, unsigned char *dst,
- int dst_stride) {
- double ftmp[2];
- uint64_t tmp[1];
- /* clang-format off */
- __asm__ volatile (
- COPY_MEM_8X2
- COPY_MEM_8X2
- : [ftmp0]"=&f"(ftmp[0]), [ftmp1]"=&f"(ftmp[1]),
- [tmp0]"=&r"(tmp[0]),
- [dst]"+&r"(dst), [src]"+&r"(src)
- : [src_stride]"r"((mips_reg)src_stride),
- [dst_stride]"r"((mips_reg)dst_stride)
- : "memory"
- );
- /* clang-format on */
- }
|