Update contrib.
2 * LIBOIL - Library of Optimized Inner Loops
3 * Copyright (c) 2003,2004 David A. Schleef <ds@schleef.org>
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions are met:
9 * 1. Redistributions of source code must retain the above copyright
10 * notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 * notice, this list of conditions and the following disclaimer in the
13 * documentation and/or other materials provided with the distribution.
15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
16 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
19 * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
20 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
21 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
23 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
24 * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
25 * POSSIBILITY OF SUCH DAMAGE.
27 //Portions Copyright (c) 2008-2009 Nokia Corporation and/or its subsidiary(-ies). All rights reserved.
33 #include <liboil/liboilfunction.h>
34 #include "liboil/simdpack/simdpack.h"
38 diffsquaresum_f64_i10_simple(double *dest, double *src1, int sstr1, double *src2,
46 x = OIL_GET(src1, i*sstr1, double) -
47 OIL_GET(src2, i*sstr2, double);
54 OIL_DEFINE_IMPL (diffsquaresum_f64_i10_simple, diffsquaresum_f64);
57 diffsquaresum_f64_i10_fast(double *dest, double *src1, int sstr1, double *src2,
66 OIL_INCREMENT (src1, sstr1);
67 OIL_INCREMENT (src2, sstr2);
73 OIL_DEFINE_IMPL (diffsquaresum_f64_i10_fast, diffsquaresum_f64);
76 diffsquaresum_f64_i10_unroll2(double *dest, double *src1, int sstr1, double *src2,
86 OIL_INCREMENT (src1, sstr1);
87 OIL_INCREMENT (src2, sstr2);
93 OIL_INCREMENT (src1, sstr1);
94 OIL_INCREMENT (src2, sstr2);
97 OIL_INCREMENT (src1, sstr1);
98 OIL_INCREMENT (src2, sstr2);
104 OIL_DEFINE_IMPL (diffsquaresum_f64_i10_unroll2, diffsquaresum_f64);
107 diffsquaresum_f64_i10_unroll4(double *dest, double *src1, int sstr1,
108 double *src2, int sstr2, int n)
119 OIL_INCREMENT (src1, sstr1);
120 OIL_INCREMENT (src2, sstr2);
126 OIL_INCREMENT (src1, sstr1);
127 OIL_INCREMENT (src2, sstr2);
130 OIL_INCREMENT (src1, sstr1);
131 OIL_INCREMENT (src2, sstr2);
134 OIL_INCREMENT (src1, sstr1);
135 OIL_INCREMENT (src2, sstr2);
138 OIL_INCREMENT (src1, sstr1);
139 OIL_INCREMENT (src2, sstr2);
143 *dest = sum0 + sum1 + sum2 + sum3;
145 OIL_DEFINE_IMPL (diffsquaresum_f64_i10_unroll4, diffsquaresum_f64);
152 OilFunctionImpl* __oil_function_impl_diffsquaresum_f64_i10_simple() {
153 return &_oil_function_impl_diffsquaresum_f64_i10_simple;
159 OilFunctionImpl* __oil_function_impl_diffsquaresum_f64_i10_fast() {
160 return &_oil_function_impl_diffsquaresum_f64_i10_fast;
166 OilFunctionImpl* __oil_function_impl_diffsquaresum_f64_i10_unroll2() {
167 return &_oil_function_impl_diffsquaresum_f64_i10_unroll2;
173 OilFunctionImpl* __oil_function_impl_diffsquaresum_f64_i10_unroll4() {
174 return &_oil_function_impl_diffsquaresum_f64_i10_unroll4;