Update contrib.
2 * LIBOIL - Library of Optimized Inner Loops
3 * Copyright (c) 2003,2004 David A. Schleef <ds@schleef.org>
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 * notice, this list of conditions and the following disclaimer in the
13 * documentation and/or other materials provided with the distribution.
15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
16 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
19 * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
20 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
23 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
24 * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
25 * POSSIBILITY OF SUCH DAMAGE.
27 //Portions Copyright (c) 2008-2009 Nokia Corporation and/or its subsidiary(-ies). All rights reserved.
33 #include <liboil/liboilfunction.h>
34 #include "liboil/simdpack/simdpack.h"
/*
 * average2_u8_trick: stores the truncating average of bytes read from src1
 * and src2 into dest.
 *
 * dest/dstr:   output byte pointer and the index step used between
 *              consecutive outputs (see dest[1*dstr] below).
 * src1/sstr1:  first input byte pointer and its index step.
 * src2/sstr2:  second input byte pointer and its index step.
 * n:           presumably the number of elements to process; its use is not
 *              visible in this excerpt -- TODO confirm.
 *
 * NOTE(review): the loop headers, local declarations, pointer advances and
 * the enclosing braces are not visible in this excerpt.
 */
39 average2_u8_trick (uint8_t * dest, int dstr, uint8_t *src1, int sstr1,
40 uint8_t *src2, int sstr2, int n)
/* One-element step: the operands are promoted to int before the addition, so
 * the sum (at most 510) cannot wrap; >> 1 halves it, rounding down. */
45 *dest = (*src1 + *src2) >> 1;
/* Pack four src1 bytes, taken sstr1 apart, into one word with the first byte
 * in the most significant position.
 * NOTE(review): src1[0] is promoted to (signed) int before "<< 24"; for byte
 * values >= 0x80 that shifts into the sign bit, which is undefined behaviour
 * for a signed left shift. Casting each byte to an unsigned 32-bit type first
 * would avoid it. */
52 x = (src1[0] << 24) | (src1[sstr1] << 16) | (src1[2 *
53 sstr1] << 8) | (src1[3 * sstr1]);
/* Same packing for four src2 bytes taken sstr2 apart (same promotion caveat). */
54 y = (src2[0] << 24) | (src2[sstr2] << 16) | (src2[2 *
55 sstr2] << 8) | (src2[3 * sstr2]);
/* Per-byte average of all four lanes at once, using
 * a + b == 2*(a & b) + (a ^ b), hence floor((a + b) / 2) == (a & b) + ((a ^ b) >> 1).
 * The 0xfefefefe mask clears the low bit of every byte before the shift so
 * that no bit crosses into the neighbouring lane. */
56 d = (((x ^ y) & 0xfefefefe) >> 1) + (x & y);
/* Unpack: each store keeps only the low 8 bits of the shifted value when it
 * is converted to uint8_t. The store of the top byte (d >> 24) is not visible
 * in this excerpt. */
58 dest[1*dstr] = (d >> 16);
59 dest[2*dstr] = (d >> 8);
60 dest[3*dstr] = (d >> 0);
/* Presumably registers average2_u8_trick as an implementation of the
 * average2_u8 function class -- confirm against the OIL_DEFINE_IMPL macro. */
68 OIL_DEFINE_IMPL (average2_u8_trick, average2_u8);
/*
 * average2_u8_fast: stores the truncating average of a src1 byte and a src2
 * byte into dest.
 *
 * Parameters mirror the other average2_u8 implementations in this file:
 * dest/src1/src2 are byte pointers; dstr/sstr1/sstr2 are presumably the
 * per-element steps and n the element count -- their use is not visible in
 * this excerpt, TODO confirm.
 *
 * NOTE(review): the loop, pointer advances and enclosing braces are not
 * visible in this excerpt.
 */
71 average2_u8_fast (uint8_t * dest, int dstr, uint8_t *src1, int sstr1,
72 uint8_t *src2, int sstr2, int n)
/* Operands are promoted to int before the addition, so the sum cannot wrap;
 * >> 1 halves it, rounding down. */
75 *dest = (*src1 + *src2) >> 1;
/* Presumably registers average2_u8_fast as an implementation of the
 * average2_u8 function class -- confirm against the OIL_DEFINE_IMPL macro. */
83 OIL_DEFINE_IMPL (average2_u8_fast, average2_u8);
/*
 * average2_u8_unroll4: stores the truncating average of src1 and src2 bytes
 * into dest, with the averaging statement written out several times.
 *
 * Parameters mirror the other average2_u8 implementations in this file:
 * dest/src1/src2 are byte pointers; dstr/sstr1/sstr2 are presumably the
 * per-element steps and n the element count -- their use is not visible in
 * this excerpt, TODO confirm.
 *
 * NOTE(review): the loop headers, the pointer advances between the repeated
 * statements and the enclosing braces are not visible in this excerpt. As
 * shown, every statement below reads and writes through the same three
 * pointers, so the advances must happen on the lines that are missing here.
 */
86 average2_u8_unroll4 (uint8_t * dest, int dstr, uint8_t *src1, int sstr1,
87 uint8_t *src2, int sstr2, int n)
/* Operands are promoted to int before the addition, so the sum cannot wrap;
 * >> 1 halves it, rounding down. Judging by the name and the listing numbers,
 * this first occurrence presumably handles leftover elements before the
 * four-way unrolled body -- TODO confirm. */
90 *dest = (*src1 + *src2) >> 1;
/* Four further copies of the same averaging step (presumably the unrolled
 * loop body -- TODO confirm). */
97 *dest = (*src1 + *src2) >> 1;
101 *dest = (*src1 + *src2) >> 1;
105 *dest = (*src1 + *src2) >> 1;
109 *dest = (*src1 + *src2) >> 1;
/* Presumably registers average2_u8_unroll4 as an implementation of the
 * average2_u8 function class -- confirm against the OIL_DEFINE_IMPL macro. */
117 OIL_DEFINE_IMPL (average2_u8_unroll4, average2_u8);
/*
 * Accessor returning the address of _oil_function_impl_average2_u8_trick.
 * That object is not declared in the visible lines; presumably it is emitted
 * by OIL_DEFINE_IMPL (average2_u8_trick, ...) -- TODO confirm.
 * NOTE(review): the empty "()" leaves the parameter list unspecified in C
 * ("(void)" would state it explicitly), and identifiers containing "__" are
 * reserved for the implementation. The closing brace is not visible in this
 * excerpt.
 */
123 OilFunctionImpl* __oil_function_impl_average2_u8_trick() {
124 return &_oil_function_impl_average2_u8_trick;
/*
 * Accessor returning the address of _oil_function_impl_average2_u8_fast.
 * That object is not declared in the visible lines; presumably it is emitted
 * by OIL_DEFINE_IMPL (average2_u8_fast, ...) -- TODO confirm.
 * NOTE(review): the empty "()" leaves the parameter list unspecified in C
 * ("(void)" would state it explicitly), and identifiers containing "__" are
 * reserved for the implementation. The closing brace is not visible in this
 * excerpt.
 */
130 OilFunctionImpl* __oil_function_impl_average2_u8_fast() {
131 return &_oil_function_impl_average2_u8_fast;
/*
 * Accessor returning the address of _oil_function_impl_average2_u8_unroll4.
 * That object is not declared in the visible lines; presumably it is emitted
 * by OIL_DEFINE_IMPL (average2_u8_unroll4, ...) -- TODO confirm.
 * NOTE(review): the empty "()" leaves the parameter list unspecified in C
 * ("(void)" would state it explicitly), and identifiers containing "__" are
 * reserved for the implementation. The closing brace is not visible in this
 * excerpt.
 */
137 OilFunctionImpl* __oil_function_impl_average2_u8_unroll4() {
138 return &_oil_function_impl_average2_u8_unroll4;