1.1 --- /dev/null Thu Jan 01 00:00:00 1970 +0000
1.2 +++ b/os/ossrv/genericopenlibs/liboil/src/simdpack/abs_misc.c Fri Jun 15 03:10:57 2012 +0200
1.3 @@ -0,0 +1,151 @@
1.4 +/*
1.5 + * LIBOIL - Library of Optimized Inner Loops
1.6 + * Copyright (c) 2003,2004 David A. Schleef <ds@schleef.org>
1.7 + * All rights reserved.
1.8 + *
1.9 + * Redistribution and use in source and binary forms, with or without
1.10 + * modification, are permitted provided that the following conditions
1.11 + * are met:
1.12 + * 1. Redistributions of source code must retain the above copyright
1.13 + * notice, this list of conditions and the following disclaimer.
1.14 + * 2. Redistributions in binary form must reproduce the above copyright
1.15 + * notice, this list of conditions and the following disclaimer in the
1.16 + * documentation and/or other materials provided with the distribution.
1.17 + *
1.18 + * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
1.19 + * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
1.20 + * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
1.21 + * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
1.22 + * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
1.23 + * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
1.24 + * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
1.25 + * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
1.26 + * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
1.27 + * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
1.28 + * POSSIBILITY OF SUCH DAMAGE.
1.29 + */
1.30 +//Portions Copyright (c) 2008-2009 Nokia Corporation and/or its subsidiary(-ies). All rights reserved.
1.31 +
1.32 +#ifdef HAVE_CONFIG_H
1.33 +#include "config.h"
1.34 +#endif
1.35 +
1.36 +#include <liboil/liboilfunction.h>
1.37 +#include "liboil/simdpack/simdpack.h"
1.38 +/* ABS(x): x if x > 0, else -(x).  x is expanded more than once: avoid side effects. */
1.39 +#define ABS(x) ((x)>0 ? (x) : -(x))
1.40 +
1.41 +/* abs_u16_s16 variant, unrolled by two: writes ABS(*src) to *dest n times,
1.42 + * stepping dest/src with OIL_INCREMENT by dstr/sstr after each element. */
1.43 +static void
1.44 +abs_u16_s16_unroll2 (uint16_t * dest, int dstr, int16_t * src, int sstr, int n)
1.45 +{
1.46 +  /* On two's-complement targets a negative odd n has its low bit set, so
1.47 +   * it must be rejected before the peel below can touch any memory. */
1.48 +  if (n <= 0)
1.49 +    return;
1.50 +  if (n & 1) {                  /* peel one element so n becomes even */
1.51 +    *dest = ABS (*src);
1.52 +    OIL_INCREMENT (dest, dstr);
1.53 +    OIL_INCREMENT (src, sstr);
1.54 +    n--;
1.55 +  }
1.56 +  for (; n > 0; n -= 2) {       /* two elements per iteration */
1.57 +    *dest = ABS (*src); OIL_INCREMENT (dest, dstr); OIL_INCREMENT (src, sstr);
1.58 +    *dest = ABS (*src); OIL_INCREMENT (dest, dstr); OIL_INCREMENT (src, sstr);
1.59 +  }
1.60 +OIL_DEFINE_IMPL (abs_u16_s16_unroll2, abs_u16_s16);
1.61 +
1.62 +/* abs_u16_s16 variant, unrolled by four: writes ABS(*src) to *dest n times,
1.63 + * stepping dest/src with OIL_INCREMENT by dstr/sstr after each element. */
1.64 +static void
1.65 +abs_u16_s16_unroll4 (uint16_t * dest, int dstr, int16_t * src, int sstr, int n)
1.66 +{
1.67 +  /* Reject n <= 0 up front: on two's-complement targets a negative n that
1.68 +   * is not a multiple of four has low bits set and would enter the peel
1.69 +   * loop below, reading and writing up to three elements. */
1.70 +  if (n <= 0)
1.71 +    return;
1.72 +
1.73 +  /* Peel up to three elements so the remaining count is a multiple of 4. */
1.74 +  for (; n & 3; n--) {
1.75 +    *dest = ABS (*src);
1.76 +    OIL_INCREMENT (dest, dstr);
1.77 +    OIL_INCREMENT (src, sstr);
1.78 +  }
1.79 +  /* Main body: four elements per iteration. */
1.80 +  for (; n > 0; n -= 4) {
1.81 +    *dest = ABS (*src); OIL_INCREMENT (dest, dstr); OIL_INCREMENT (src, sstr);
1.82 +    *dest = ABS (*src); OIL_INCREMENT (dest, dstr); OIL_INCREMENT (src, sstr);
1.83 +    *dest = ABS (*src); OIL_INCREMENT (dest, dstr); OIL_INCREMENT (src, sstr);
1.84 +    *dest = ABS (*src); OIL_INCREMENT (dest, dstr); OIL_INCREMENT (src, sstr);
1.85 +  }
1.86 +}
1.87 +OIL_DEFINE_IMPL (abs_u16_s16_unroll4, abs_u16_s16);
1.88 +
1.89 +/* Branch-free abs_u16_s16 variant: per element stores val - 2*neg, where
1.90 + * neg = (val >> 15) & val.  NOTE(review): neg is val for negative input only
1.91 + * if >> sign-extends, which C leaves implementation-defined -- confirm. */
1.92 +static void
1.93 +abs_u16_s16_fast (uint16_t * dest, int dstr, int16_t * src, int sstr, int n)
1.94 +{
1.95 +  for (; n > 0; n--) {
1.96 +    const int16_t val = *src;
1.97 +    const int16_t neg = (val >> 15) & val;   /* mask keeps val or yields 0 */
1.98 +    *dest = val - neg - neg;                 /* subtract twice, not 2*neg */
1.99 +    OIL_INCREMENT (dest, dstr);
1.100 +    OIL_INCREMENT (src, sstr);
1.101 +  }
1.102 +}
1.103 +
1.104 +OIL_DEFINE_IMPL (abs_u16_s16_fast, abs_u16_s16);
1.105 +
1.106 +
1.107 +/* Branch-free abs_u32_s32 variant.  For i in [0, n) it reads an int32_t via
1.108 + * OIL_GET (src, i * sstr, ...) and stores x - y - y, with y = x when x < 0 and
1.109 + * 0 otherwise, via OIL_GET (dest, i * dstr, ...).  The arithmetic is done in
1.110 + * uint32_t so INT32_MIN yields 0x80000000 by wraparound, not signed overflow. */
1.111 +static void
1.112 +abs_u32_s32_fast (uint32_t * dest, int dstr, int32_t * src, int sstr, int n)
1.113 +{
1.114 +  int i;
1.115 +  for (i = 0; i < n; i++) {
1.116 +    const int32_t x = OIL_GET (src, i * sstr, int32_t);
1.117 +    const uint32_t ux = (uint32_t) x;
1.118 +    /* All-ones mask when x is negative, so uy is either ux or 0. */
1.119 +    const uint32_t uy = ux & (0u - (uint32_t) (x < 0));
1.120 +    OIL_GET (dest, i * dstr, uint32_t) = ux - uy - uy;
1.121 +  }
1.122 +}
1.123 +OIL_DEFINE_IMPL (abs_u32_s32_fast, abs_u32_s32);
1.124 +
1.125 +
1.126 +
1.127 +#ifdef __SYMBIAN32__
1.128 +/* Symbian-only accessors: each returns the address of the OilFunctionImpl
1.129 + * object named _oil_function_impl_<impl> for one implementation in this
1.130 + * file.  NOTE(review): those objects are presumably emitted by the
1.131 + * OIL_DEFINE_IMPL lines above -- confirm against liboilfunction.h. */
1.132 +
1.133 +OilFunctionImpl*
1.134 +__oil_function_impl_abs_u16_s16_unroll2()
1.135 +{
1.136 +  return &_oil_function_impl_abs_u16_s16_unroll2;
1.137 +}
1.138 +OilFunctionImpl*
1.139 +__oil_function_impl_abs_u16_s16_unroll4()
1.140 +{
1.141 +  return &_oil_function_impl_abs_u16_s16_unroll4;
1.142 +}
1.143 +OilFunctionImpl*
1.144 +__oil_function_impl_abs_u16_s16_fast()
1.145 +{
1.146 +  return &_oil_function_impl_abs_u16_s16_fast;
1.147 +}
1.148 +OilFunctionImpl*
1.149 +__oil_function_impl_abs_u32_s32_fast()
1.150 +{
1.151 +  return &_oil_function_impl_abs_u32_s32_fast;
1.152 +}
1.153 +#endif
1.154 +