sl@0: /* sl@0: * LIBOIL - Library of Optimized Inner Loops sl@0: * Copyright (c) 2003,2004 David A. Schleef sl@0: * All rights reserved. sl@0: * sl@0: * Redistribution and use in source and binary forms, with or without sl@0: * modification, are permitted provided that the following conditions sl@0: * are met: sl@0: * 1. Redistributions of source code must retain the above copyright sl@0: * notice, this list of conditions and the following disclaimer. sl@0: * 2. Redistributions in binary form must reproduce the above copyright sl@0: * notice, this list of conditions and the following disclaimer in the sl@0: * documentation and/or other materials provided with the distribution. sl@0: * sl@0: * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR sl@0: * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED sl@0: * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE sl@0: * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, sl@0: * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES sl@0: * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR sl@0: * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) sl@0: * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, sl@0: * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING sl@0: * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE sl@0: * POSSIBILITY OF SUCH DAMAGE. sl@0: */ sl@0: //Portions Copyright (c) 2008-2009 Nokia Corporation and/or its subsidiary(-ies). All rights reserved. 
sl@0: sl@0: #ifdef HAVE_CONFIG_H sl@0: #include "config.h" sl@0: #endif sl@0: sl@0: /* NOTE(review): the two bare "#include" directives below have no operand in this copy; fabs() is called further down, so one of them was presumably <math.h>. Confirm against the upstream file. */ #include sl@0: #include "liboil/simdpack/simdpack.h" sl@0: #include sl@0: sl@0: sl@0: /** sl@0: * oil_sad8x8_u8: sl@0: * @d_1: destination for the sum sl@0: * @s1_8x8: first 8x8 block of uint8_t elements sl@0: * @ss1: row stride of @s1_8x8 (presumably in bytes; confirm against OIL_GET) sl@0: * @s2_8x8: second 8x8 block of uint8_t elements sl@0: * @ss2: row stride of @s2_8x8 (presumably in bytes; confirm against OIL_GET) sl@0: * sl@0: * Calculates the sum of absolute differences between elements in @s1_8x8 sl@0: * and @s2_8x8, and places the result in @d_1. sl@0: */ sl@0: OIL_DEFINE_CLASS (sad8x8_u8, sl@0: "uint32_t *d_1, uint8_t *s1_8x8, int ss1, uint8_t *s2_8x8, int ss2"); sl@0: /** sl@0: * oil_sad8x8_s16_2: sl@0: * @d_1: destination for the sum sl@0: * @s1_8x8: first 8x8 block of int16_t elements sl@0: * @ss1: row stride of @s1_8x8 (presumably in bytes; confirm against OIL_GET) sl@0: * @s2_8x8: second 8x8 block of int16_t elements sl@0: * @ss2: row stride of @s2_8x8 (presumably in bytes; confirm against OIL_GET) sl@0: * sl@0: * Calculates the sum of absolute differences between elements in @s1_8x8 sl@0: * and @s2_8x8, and places the result in @d_1. sl@0: */ sl@0: OIL_DEFINE_CLASS (sad8x8_s16_2, sl@0: "uint32_t *d_1, int16_t *s1_8x8, int ss1, int16_t *s2_8x8, int ss2"); sl@0: /** sl@0: * oil_sad8x8_f64_2: sl@0: * @d_1: destination for the sum (a double for this class) sl@0: * @s1_8x8: first 8x8 block of double elements sl@0: * @ss1: row stride of @s1_8x8 (presumably in bytes; confirm against OIL_GET) sl@0: * @s2_8x8: second 8x8 block of double elements sl@0: * @ss2: row stride of @s2_8x8 (presumably in bytes; confirm against OIL_GET) sl@0: * sl@0: * Calculates the sum of absolute differences between elements in @s1_8x8 sl@0: * and @s2_8x8, and places the result in @d_1. sl@0: */ sl@0: OIL_DEFINE_CLASS (sad8x8_f64_2, sl@0: "double *d_1, double *s1_8x8, int ss1, double *s2_8x8, int ss2"); sl@0: /** sl@0: * oil_sad8x8_8xn_u8: sl@0: * @d_n: destination for the results sl@0: * @s1_8x8: 8x8 block of uint8_t elements sl@0: * @ss1: row stride of @s1_8x8 (presumably in bytes) sl@0: * @s2_8xnp7: array of uint8_t rows that the 8x8 blocks are taken from sl@0: * @ss2: row stride of @s2_8xnp7 (presumably in bytes) sl@0: * @n: presumably the number of results written to @d_n; confirm sl@0: * sl@0: * Calculates the sum of absolute differences between elements in @s1_8x8 sl@0: * and the 8x8 block of array elements starting at row i in @s2_8xnp7, and sl@0: * places the result in @d_n. (i presumably ranges over 0..@n-1 with one sl@0: * result per i; the reference implementation is not fully visible in this sl@0: * copy, so confirm.) sl@0: */ sl@0: OIL_DEFINE_CLASS (sad8x8_8xn_u8, sl@0: "uint32_t *d_n, uint8_t *s1_8x8, int ss1, uint8_t *s2_8xnp7, int ss2, int n"); sl@0: sl@0: /** sl@0: * oil_sad12x12_u8: sl@0: * @d_1: destination for the sum sl@0: * @s1_12x12: first 12x12 block of uint8_t elements sl@0: * @ss1: row stride of @s1_12x12 (presumably in bytes) sl@0: * @s2_12x12: second 12x12 block of uint8_t elements sl@0: * @ss2: row stride of @s2_12x12 (presumably in bytes) sl@0: * sl@0: * Calculates the sum of absolute differences between elements in @s1_12x12 sl@0: * and @s2_12x12, and places the result in @d_1. 
sl@0: */ sl@0: OIL_DEFINE_CLASS (sad12x12_u8, sl@0: "uint32_t *d_1, uint8_t *s1_12x12, int ss1, uint8_t *s2_12x12, int ss2"); sl@0: /** sl@0: * oil_sad12x12_12xn_u8: sl@0: * @d_n: destination for the results sl@0: * @s1_12x12: 12x12 block of uint8_t elements sl@0: * @ss1: row stride of @s1_12x12 (presumably in bytes) sl@0: * @s2_12xnp11: array of uint8_t rows that the 12x12 blocks are taken from sl@0: * @ss2: row stride of @s2_12xnp11 (presumably in bytes) sl@0: * @n: presumably the number of results written to @d_n; confirm sl@0: * sl@0: * Calculates the sum of absolute differences between elements in @s1_12x12 sl@0: * and the 12x12 block of array elements starting at row i in @s2_12xnp11, and sl@0: * places the result in @d_n. (i presumably ranges over 0..@n-1; confirm.) sl@0: */ sl@0: OIL_DEFINE_CLASS (sad12x12_12xn_u8, sl@0: "uint32_t *d_n, uint8_t *s1_12x12, int ss1, uint8_t *s2_12xnp11, int ss2, int n"); sl@0: /** sl@0: * oil_sad16x16_u8: sl@0: * @d_1: destination for the sum sl@0: * @s1_16x16: first 16x16 block of uint8_t elements sl@0: * @ss1: row stride of @s1_16x16 (presumably in bytes) sl@0: * @s2_16x16: second 16x16 block of uint8_t elements sl@0: * @ss2: row stride of @s2_16x16 (presumably in bytes) sl@0: * sl@0: * Calculates the sum of absolute differences between elements in @s1_16x16 sl@0: * and @s2_16x16, and places the result in @d_1. sl@0: */ sl@0: OIL_DEFINE_CLASS (sad16x16_u8, sl@0: "uint32_t *d_1, uint8_t *s1_16x16, int ss1, uint8_t *s2_16x16, int ss2"); sl@0: /** sl@0: * oil_sad16x16_16xn_u8: sl@0: * @d_n: destination for the results sl@0: * @s1_16x16: 16x16 block of uint8_t elements sl@0: * @ss1: row stride of @s1_16x16 (presumably in bytes) sl@0: * @s2_16xnp15: array of uint8_t rows that the 16x16 blocks are taken from sl@0: * @ss2: row stride of @s2_16xnp15 (presumably in bytes) sl@0: * @n: presumably the number of results written to @d_n; confirm sl@0: * sl@0: * Calculates the sum of absolute differences between elements in @s1_16x16 sl@0: * and the 16x16 block of array elements starting at row i in @s2_16xnp15, and sl@0: * places the result in @d_n. (i presumably ranges over 0..@n-1; confirm.) 
sl@0: */ sl@0: OIL_DEFINE_CLASS (sad16x16_16xn_u8, sl@0: "uint32_t *d_n, uint8_t *s1_16x16, int ss1, uint8_t *s2_16xnp15, int ss2, int n"); sl@0: sl@0: sl@0: /* Reference implementation of sad8x8_f64_2: for every row i and column j of an 8x8 block it reads one double from each source through OIL_GET at offset sstr * i + j * sizeof (double), accumulates fabs() of their difference, and stores the total in *dest. */ static void sl@0: sad8x8_f64_2_ref (double *dest, double *src1, int sstr1, double *src2, sl@0: int sstr2) sl@0: { sl@0: int i, j; sl@0: double sum; sl@0: sl@0: sum = 0; sl@0: for (i = 0; i < 8; i++) { sl@0: for (j = 0; j < 8; j++) { sl@0: sum += fabs (OIL_GET (src1, sstr1 * i + j * sizeof (double), double) - sl@0: OIL_GET (src2, sstr2 * i + j * sizeof (double), double)); sl@0: } sl@0: } sl@0: *dest = sum; sl@0: } sl@0: sl@0: OIL_DEFINE_IMPL_REF (sad8x8_f64_2_ref, sad8x8_f64_2); sl@0: sl@0: /* Reference implementation of sad8x8_s16_2: each pair of int16_t elements is cast to int before subtracting, the absolute value of the difference is added to a uint32_t total over the 8x8 block, and the total is stored in *dest. */ static void sl@0: sad8x8_s16_2_ref (uint32_t * dest, int16_t * src1, int sstr1, int16_t * src2, sl@0: int sstr2) sl@0: { sl@0: int i, j; sl@0: int d; sl@0: uint32_t sum; sl@0: sl@0: sum = 0; sl@0: for (i = 0; i < 8; i++) { sl@0: for (j = 0; j < 8; j++) { sl@0: d = ((int) OIL_GET (src1, sstr1 * i + j * sizeof (int16_t), int16_t)) - sl@0: ((int) OIL_GET (src2, sstr2 * i + j * sizeof (int16_t), int16_t)); sl@0: sum += (d < 0) ? -d : d; sl@0: } sl@0: } sl@0: *dest = sum; sl@0: } sl@0: OIL_DEFINE_IMPL_REF (sad8x8_s16_2_ref, sad8x8_s16_2); sl@0: sl@0: /* Reference implementation of sad8x8_u8: each pair of uint8_t elements is cast to int before subtracting, the absolute value of the difference is added to a uint32_t total over the 8x8 block, and the total is stored in *dest. */ static void sl@0: sad8x8_u8_ref (uint32_t * dest, uint8_t * src1, int sstr1, uint8_t * src2, sl@0: int sstr2) sl@0: { sl@0: int i, j; sl@0: int d; sl@0: uint32_t sum; sl@0: sl@0: sum = 0; sl@0: for (i = 0; i < 8; i++) { sl@0: for (j = 0; j < 8; j++) { sl@0: d = ((int) OIL_GET (src1, sstr1 * i + j * sizeof (uint8_t), uint8_t)) - sl@0: ((int) OIL_GET (src2, sstr2 * i + j * sizeof (uint8_t), uint8_t)); sl@0: sum += (d < 0) ? 
-d : d; sl@0: } sl@0: } sl@0: *dest = sum; sl@0: } sl@0: OIL_DEFINE_IMPL_REF (sad8x8_u8_ref, sad8x8_u8); sl@0: sl@0: /* Reference implementation of sad8x8_8xn_u8. NOTE(review): this copy is damaged here. The text after "for (i=0;i" is missing up to the closing "func; }" of what appears to be the first Symbian accessor, so the body of this function and any definitions that followed it are not present. Restore the span from the upstream file before building. */ static void sl@0: sad8x8_8xn_u8_ref (uint32_t * dest, uint8_t * src1, int sstr1, uint8_t * src2, sl@0: int sstr2, int n) sl@0: { sl@0: int i, j, k; sl@0: int d; sl@0: uint32_t sum; sl@0: sl@0: for (i=0;ifunc; sl@0: } sl@0: #endif sl@0: sl@0: #ifdef __SYMBIAN32__ sl@0: sl@0: /* Symbian-only accessors. Each one stores the result of the matching __oil_function_class_<name>() call in oil_function_class_ptr_<name> and returns the address of that object's func member. */ EXPORT_C void** _oil_function_class_ptr_sad8x8_s16_2 () { sl@0: oil_function_class_ptr_sad8x8_s16_2 = __oil_function_class_sad8x8_s16_2(); sl@0: return &oil_function_class_ptr_sad8x8_s16_2->func; sl@0: } sl@0: #endif sl@0: sl@0: #ifdef __SYMBIAN32__ sl@0: sl@0: EXPORT_C void** _oil_function_class_ptr_sad8x8_f64_2 () { sl@0: oil_function_class_ptr_sad8x8_f64_2 = __oil_function_class_sad8x8_f64_2(); sl@0: return &oil_function_class_ptr_sad8x8_f64_2->func; sl@0: } sl@0: #endif sl@0: sl@0: #ifdef __SYMBIAN32__ sl@0: sl@0: EXPORT_C void** _oil_function_class_ptr_sad8x8_8xn_u8 () { sl@0: oil_function_class_ptr_sad8x8_8xn_u8 = __oil_function_class_sad8x8_8xn_u8(); sl@0: return &oil_function_class_ptr_sad8x8_8xn_u8->func; sl@0: } sl@0: #endif sl@0: sl@0: #ifdef __SYMBIAN32__ sl@0: sl@0: EXPORT_C void** _oil_function_class_ptr_sad12x12_u8 () { sl@0: oil_function_class_ptr_sad12x12_u8 = __oil_function_class_sad12x12_u8(); sl@0: return &oil_function_class_ptr_sad12x12_u8->func; sl@0: } sl@0: #endif sl@0: sl@0: #ifdef __SYMBIAN32__ sl@0: sl@0: EXPORT_C void** _oil_function_class_ptr_sad12x12_12xn_u8 () { sl@0: oil_function_class_ptr_sad12x12_12xn_u8 = __oil_function_class_sad12x12_12xn_u8(); sl@0: return &oil_function_class_ptr_sad12x12_12xn_u8->func; sl@0: } sl@0: #endif sl@0: sl@0: #ifdef __SYMBIAN32__ sl@0: sl@0: EXPORT_C void** _oil_function_class_ptr_sad16x16_u8 () { sl@0: oil_function_class_ptr_sad16x16_u8 = __oil_function_class_sad16x16_u8(); sl@0: return &oil_function_class_ptr_sad16x16_u8->func; sl@0: } sl@0: #endif sl@0: sl@0: #ifdef __SYMBIAN32__ sl@0: sl@0: EXPORT_C void** 
_oil_function_class_ptr_sad16x16_16xn_u8 () { sl@0: oil_function_class_ptr_sad16x16_16xn_u8 = __oil_function_class_sad16x16_16xn_u8(); sl@0: return &oil_function_class_ptr_sad16x16_16xn_u8->func; sl@0: } sl@0: #endif sl@0: