float_dsp_mips.c 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113
  1. /*
  2. * Copyright (c) 2012
  3. * MIPS Technologies, Inc., California.
  4. *
  5. * Redistribution and use in source and binary forms, with or without
  6. * modification, are permitted provided that the following conditions
  7. * are met:
  8. * 1. Redistributions of source code must retain the above copyright
  9. * notice, this list of conditions and the following disclaimer.
  10. * 2. Redistributions in binary form must reproduce the above copyright
  11. * notice, this list of conditions and the following disclaimer in the
  12. * documentation and/or other materials provided with the distribution.
  13. * 3. Neither the name of the MIPS Technologies, Inc., nor the names of its
  14. * contributors may be used to endorse or promote products derived from
  15. * this software without specific prior written permission.
  16. *
  17. * THIS SOFTWARE IS PROVIDED BY THE MIPS TECHNOLOGIES, INC. ``AS IS'' AND
  18. * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  19. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  20. * ARE DISCLAIMED. IN NO EVENT SHALL THE MIPS TECHNOLOGIES, INC. BE LIABLE
  21. * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  22. * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  23. * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  24. * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  25. * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  26. * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  27. * SUCH DAMAGE.
  28. *
  29. * Author: Branimir Vasic (bvasic@mips.com)
  30. *
  31. * This file is part of FFmpeg.
  32. *
  33. * FFmpeg is free software; you can redistribute it and/or
  34. * modify it under the terms of the GNU Lesser General Public
  35. * License as published by the Free Software Foundation; either
  36. * version 2.1 of the License, or (at your option) any later version.
  37. *
  38. * FFmpeg is distributed in the hope that it will be useful,
  39. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  40. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  41. * Lesser General Public License for more details.
  42. *
  43. * You should have received a copy of the GNU Lesser General Public
  44. * License along with FFmpeg; if not, write to the Free Software
  45. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  46. */
  47. /**
  48. * @file
  49. * Reference: libavutil/float_dsp.c
  50. */
  51. #include "config.h"
  52. #include "libavutil/float_dsp.h"
  53. #if HAVE_INLINE_ASM && HAVE_MIPSFPU
  54. static void vector_fmul_mips(float *dst, const float *src0, const float *src1,
  55. int len)
  56. {
  57. int i;
  58. if (len & 3) {
  59. for (i = 0; i < len; i++)
  60. dst[i] = src0[i] * src1[i];
  61. } else {
  62. float *d = (float *)dst;
  63. float *d_end = d + len;
  64. float *s0 = (float *)src0;
  65. float *s1 = (float *)src1;
  66. float src0_0, src0_1, src0_2, src0_3;
  67. float src1_0, src1_1, src1_2, src1_3;
  68. __asm__ volatile (
  69. "1: \n\t"
  70. "lwc1 %[src0_0], 0(%[s0]) \n\t"
  71. "lwc1 %[src1_0], 0(%[s1]) \n\t"
  72. "lwc1 %[src0_1], 4(%[s0]) \n\t"
  73. "lwc1 %[src1_1], 4(%[s1]) \n\t"
  74. "lwc1 %[src0_2], 8(%[s0]) \n\t"
  75. "lwc1 %[src1_2], 8(%[s1]) \n\t"
  76. "lwc1 %[src0_3], 12(%[s0]) \n\t"
  77. "lwc1 %[src1_3], 12(%[s1]) \n\t"
  78. "mul.s %[src0_0], %[src0_0], %[src1_0] \n\t"
  79. "mul.s %[src0_1], %[src0_1], %[src1_1] \n\t"
  80. "mul.s %[src0_2], %[src0_2], %[src1_2] \n\t"
  81. "mul.s %[src0_3], %[src0_3], %[src1_3] \n\t"
  82. "swc1 %[src0_0], 0(%[d]) \n\t"
  83. "swc1 %[src0_1], 4(%[d]) \n\t"
  84. "swc1 %[src0_2], 8(%[d]) \n\t"
  85. "swc1 %[src0_3], 12(%[d]) \n\t"
  86. "addiu %[s0], %[s0], 16 \n\t"
  87. "addiu %[s1], %[s1], 16 \n\t"
  88. "addiu %[d], %[d], 16 \n\t"
  89. "bne %[d], %[d_end], 1b \n\t"
  90. : [src0_0]"=&f"(src0_0), [src0_1]"=&f"(src0_1),
  91. [src0_2]"=&f"(src0_2), [src0_3]"=&f"(src0_3),
  92. [src1_0]"=&f"(src1_0), [src1_1]"=&f"(src1_1),
  93. [src1_2]"=&f"(src1_2), [src1_3]"=&f"(src1_3),
  94. [d]"+r"(d), [s0]"+r"(s0), [s1]"+r"(s1)
  95. : [d_end]"r"(d_end)
  96. : "memory"
  97. );
  98. }
  99. }
  100. #endif /* HAVE_INLINE_ASM && HAVE_MIPSFPU */
  101. void ff_float_dsp_init_mips(AVFloatDSPContext *fdsp) {
  102. #if HAVE_INLINE_ASM && HAVE_MIPSFPU
  103. fdsp->vector_fmul = vector_fmul_mips;
  104. #endif /* HAVE_INLINE_ASM && HAVE_MIPSFPU */
  105. }