os/ossrv/genericopenlibs/liboil/src/simdpack/scalarmult.c
author sl
Tue, 10 Jun 2014 14:32:02 +0200
changeset 1 260cb5ec6c19
permissions -rw-r--r--
Update contrib.
sl@0
     1
/*
 * LIBOIL - Library of Optimized Inner Loops
 * Copyright (c) 2003,2004 David A. Schleef <ds@schleef.org>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
 * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
 * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */
//Portions Copyright (c)  2008-2009 Nokia Corporation and/or its subsidiary(-ies). All rights reserved.
sl@0
    28
sl@0
    29
#ifdef HAVE_CONFIG_H
sl@0
    30
#include "config.h"
sl@0
    31
#endif
sl@0
    32
sl@0
    33
#include <liboil/liboilfunction.h>
sl@0
    34
#include "liboil/simdpack/simdpack.h"
sl@0
    35
sl@0
    36
#ifdef __SYMBIAN32__
sl@0
    37
#ifdef __WINSCW__
sl@0
    38
#pragma warn_emptydecl off
sl@0
    39
#endif//__WINSCW__
sl@0
    40
#endif//__SYMBIAN32__
sl@0
    41
sl@0
    42
#define SCALARMULT_DEFINE_UNROLL2(type)		\
sl@0
    43
static void scalarmult_ ## type ## _unroll2(	\
sl@0
    44
    oil_type_ ## type *dest, int dstr,		\
sl@0
    45
    oil_type_ ## type *src, int sstr,		\
sl@0
    46
    oil_type_ ## type *val, int n)			\
sl@0
    47
{						\
sl@0
    48
  if(n&1) {					\
sl@0
    49
    *dest = *src * *val;			\
sl@0
    50
    OIL_INCREMENT(dest, dstr);			\
sl@0
    51
    OIL_INCREMENT(src, sstr);			\
sl@0
    52
  }						\
sl@0
    53
  n /= 2;					\
sl@0
    54
  while(n>0){					\
sl@0
    55
    *dest = *src * *val;			\
sl@0
    56
    OIL_INCREMENT(dest,dstr);			\
sl@0
    57
    OIL_INCREMENT(src,sstr);			\
sl@0
    58
    *dest = *src * *val;			\
sl@0
    59
    OIL_INCREMENT(dest,dstr);			\
sl@0
    60
    OIL_INCREMENT(src,sstr);			\
sl@0
    61
    n--;					\
sl@0
    62
  }						\
sl@0
    63
}						\
sl@0
    64
OIL_DEFINE_IMPL (scalarmult_ ## type ## _unroll2, scalarmult_ ## type);
sl@0
    65
sl@0
    66
SCALARMULT_DEFINE_UNROLL2 (s8);
sl@0
    67
SCALARMULT_DEFINE_UNROLL2 (u8);
sl@0
    68
SCALARMULT_DEFINE_UNROLL2 (s16);
sl@0
    69
SCALARMULT_DEFINE_UNROLL2 (u16);
sl@0
    70
SCALARMULT_DEFINE_UNROLL2 (s32);
sl@0
    71
SCALARMULT_DEFINE_UNROLL2 (u32);
sl@0
    72
SCALARMULT_DEFINE_UNROLL2 (f32);
sl@0
    73
SCALARMULT_DEFINE_UNROLL2 (f64);
sl@0
    74
sl@0
    75
#define SCALARMULT_DEFINE_UNROLL2x(type)	\
sl@0
    76
static void scalarmult_ ## type ## _unroll2x(	\
sl@0
    77
    oil_type_ ## type *dest, int dstr,		\
sl@0
    78
    oil_type_ ## type *src, int sstr,		\
sl@0
    79
    oil_type_ ## type *val, int n)			\
sl@0
    80
{						\
sl@0
    81
  oil_type_ ## type *dest2;				\
sl@0
    82
  oil_type_ ## type *src2;				\
sl@0
    83
  int i;					\
sl@0
    84
  if(n&1) {					\
sl@0
    85
    *dest = *src * *val;			\
sl@0
    86
    OIL_INCREMENT(dest, dstr);			\
sl@0
    87
    OIL_INCREMENT(src, sstr);			\
sl@0
    88
  }						\
sl@0
    89
  src2 = OIL_OFFSET(src, sstr);			\
sl@0
    90
  dest2 = OIL_OFFSET(dest, dstr);		\
sl@0
    91
  n /= 2;					\
sl@0
    92
  sstr *= 2;					\
sl@0
    93
  dstr *= 2;					\
sl@0
    94
  for(i=0;i<n;i++){				\
sl@0
    95
    OIL_GET(dest,dstr*i,oil_type_ ## type) = OIL_GET(src,sstr*i,oil_type_ ## type) * *val; \
sl@0
    96
    OIL_GET(dest2,dstr*i,oil_type_ ## type) = OIL_GET(src2,sstr*i,oil_type_ ## type) * *val; \
sl@0
    97
  }						\
sl@0
    98
}						\
sl@0
    99
OIL_DEFINE_IMPL (scalarmult_ ## type ## _unroll2x, scalarmult_ ## type);
sl@0
   100
sl@0
   101
SCALARMULT_DEFINE_UNROLL2x (s8);
sl@0
   102
SCALARMULT_DEFINE_UNROLL2x (u8);
sl@0
   103
SCALARMULT_DEFINE_UNROLL2x (s16);
sl@0
   104
SCALARMULT_DEFINE_UNROLL2x (u16);
sl@0
   105
SCALARMULT_DEFINE_UNROLL2x (s32);
sl@0
   106
SCALARMULT_DEFINE_UNROLL2x (u32);
sl@0
   107
SCALARMULT_DEFINE_UNROLL2x (f32);
sl@0
   108
SCALARMULT_DEFINE_UNROLL2x (f64);
sl@0
   109
sl@0
   110
#define SCALARMULT_DEFINE_UNROLL4(type)		\
sl@0
   111
static void scalarmult_ ## type ## _unroll4(	\
sl@0
   112
    oil_type_ ## type *dest, int dstr,		\
sl@0
   113
    oil_type_ ## type *src, int sstr,		\
sl@0
   114
    oil_type_ ## type *val, int n)			\
sl@0
   115
{						\
sl@0
   116
  if(n&1) {					\
sl@0
   117
    *dest = *src * *val;			\
sl@0
   118
    OIL_INCREMENT(dest, dstr);			\
sl@0
   119
    OIL_INCREMENT(src, sstr);			\
sl@0
   120
  }						\
sl@0
   121
  if(n&2) {					\
sl@0
   122
    *dest = *src * *val;			\
sl@0
   123
    OIL_INCREMENT(dest, dstr);			\
sl@0
   124
    OIL_INCREMENT(src, sstr);			\
sl@0
   125
    *dest = *src * *val;			\
sl@0
   126
    OIL_INCREMENT(dest, dstr);			\
sl@0
   127
    OIL_INCREMENT(src, sstr);			\
sl@0
   128
  }						\
sl@0
   129
  n /= 4;					\
sl@0
   130
  while(n>0){					\
sl@0
   131
    *dest = *src * *val;			\
sl@0
   132
    OIL_INCREMENT(dest,dstr);			\
sl@0
   133
    OIL_INCREMENT(src,sstr);			\
sl@0
   134
    *dest = *src * *val;			\
sl@0
   135
    OIL_INCREMENT(dest,dstr);			\
sl@0
   136
    OIL_INCREMENT(src,sstr);			\
sl@0
   137
    *dest = *src * *val;			\
sl@0
   138
    OIL_INCREMENT(dest,dstr);			\
sl@0
   139
    OIL_INCREMENT(src,sstr);			\
sl@0
   140
    *dest = *src * *val;			\
sl@0
   141
    OIL_INCREMENT(dest,dstr);			\
sl@0
   142
    OIL_INCREMENT(src,sstr);			\
sl@0
   143
    n--;					\
sl@0
   144
  }						\
sl@0
   145
}						\
sl@0
   146
OIL_DEFINE_IMPL (scalarmult_ ## type ## _unroll4, scalarmult_ ## type);
sl@0
   147
sl@0
   148
SCALARMULT_DEFINE_UNROLL4 (s8);
sl@0
   149
SCALARMULT_DEFINE_UNROLL4 (u8);
sl@0
   150
SCALARMULT_DEFINE_UNROLL4 (s16);
sl@0
   151
SCALARMULT_DEFINE_UNROLL4 (u16);
sl@0
   152
SCALARMULT_DEFINE_UNROLL4 (s32);
sl@0
   153
SCALARMULT_DEFINE_UNROLL4 (u32);
sl@0
   154
SCALARMULT_DEFINE_UNROLL4 (f32);
sl@0
   155
SCALARMULT_DEFINE_UNROLL4 (f64);
sl@0
   156
sl@0
   157
sl@0
   158
sl@0
   159
sl@0
   160
sl@0
   161
#define SCALARMULT_DEFINE_X(type)		\
sl@0
   162
static void scalarmult_ ## type ## _x(	\
sl@0
   163
    oil_type_ ## type *dest, int dstr,		\
sl@0
   164
    oil_type_ ## type *src, int sstr,		\
sl@0
   165
    oil_type_ ## type *val, int n)			\
sl@0
   166
{						\
sl@0
   167
  int i;					\
sl@0
   168
  for(i=0;i+1<n;i+=2){				\
sl@0
   169
    OIL_GET(dest, i*dstr,oil_type_ ## type) =        \
sl@0
   170
      OIL_GET(src, i*sstr,oil_type_ ## type) * *val; \
sl@0
   171
    OIL_GET(dest,(i+1)*dstr,oil_type_ ## type) =        \
sl@0
   172
      OIL_GET(src,(i+1)*sstr,oil_type_ ## type) * *val; \
sl@0
   173
  }						\
sl@0
   174
  if (n&1) {                                    \
sl@0
   175
    OIL_GET(dest,i*dstr,oil_type_ ## type) =        \
sl@0
   176
      OIL_GET(src,i*sstr,oil_type_ ## type) * *val; \
sl@0
   177
  }                                             \
sl@0
   178
}						\
sl@0
   179
OIL_DEFINE_IMPL (scalarmult_ ## type ## _x, scalarmult_ ## type);
sl@0
   180
sl@0
   181
sl@0
   182
SCALARMULT_DEFINE_X (s8);
sl@0
   183
SCALARMULT_DEFINE_X (u8);
sl@0
   184
SCALARMULT_DEFINE_X (s16);
sl@0
   185
SCALARMULT_DEFINE_X (u16);
sl@0
   186
SCALARMULT_DEFINE_X (s32);
sl@0
   187
SCALARMULT_DEFINE_X (u32);
sl@0
   188
SCALARMULT_DEFINE_X (f32);
sl@0
   189
SCALARMULT_DEFINE_X (f64);
sl@0
   190
sl@0
   191
#ifdef __SYMBIAN32__

/*
 * Accessor functions for the scalarmult_<type>_unroll2 implementations.
 *
 * Each function returns the address of the correspondingly named
 * _oil_function_impl_scalarmult_<type>_unroll2 object (presumably the
 * descriptor emitted by OIL_DEFINE_IMPL in SCALARMULT_DEFINE_UNROLL2 --
 * confirm against liboilfunction.h).  They are compiled only when
 * __SYMBIAN32__ is defined.
 *
 * The parameter lists are spelled (void) so the definitions are proper
 * prototypes rather than old-style unprototyped declarators.
 */
OilFunctionImpl* __oil_function_impl_scalarmult_s8_unroll2(void) {
        return &_oil_function_impl_scalarmult_s8_unroll2;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u8_unroll2(void) {
        return &_oil_function_impl_scalarmult_u8_unroll2;
}

OilFunctionImpl* __oil_function_impl_scalarmult_s16_unroll2(void) {
        return &_oil_function_impl_scalarmult_s16_unroll2;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u16_unroll2(void) {
        return &_oil_function_impl_scalarmult_u16_unroll2;
}

OilFunctionImpl* __oil_function_impl_scalarmult_s32_unroll2(void) {
        return &_oil_function_impl_scalarmult_s32_unroll2;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u32_unroll2(void) {
        return &_oil_function_impl_scalarmult_u32_unroll2;
}

OilFunctionImpl* __oil_function_impl_scalarmult_f32_unroll2(void) {
        return &_oil_function_impl_scalarmult_f32_unroll2;
}

OilFunctionImpl* __oil_function_impl_scalarmult_f64_unroll2(void) {
        return &_oil_function_impl_scalarmult_f64_unroll2;
}

#endif /* __SYMBIAN32__ */
sl@0
   246
sl@0
   247
#ifdef __SYMBIAN32__

/*
 * Accessor functions for the scalarmult_<type>_unroll4 implementations.
 *
 * Each function returns the address of the correspondingly named
 * _oil_function_impl_scalarmult_<type>_unroll4 object (presumably the
 * descriptor emitted by OIL_DEFINE_IMPL in SCALARMULT_DEFINE_UNROLL4 --
 * confirm against liboilfunction.h).  They are compiled only when
 * __SYMBIAN32__ is defined.
 *
 * The parameter lists are spelled (void) so the definitions are proper
 * prototypes rather than old-style unprototyped declarators.
 */
OilFunctionImpl* __oil_function_impl_scalarmult_s8_unroll4(void) {
        return &_oil_function_impl_scalarmult_s8_unroll4;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u8_unroll4(void) {
        return &_oil_function_impl_scalarmult_u8_unroll4;
}

OilFunctionImpl* __oil_function_impl_scalarmult_s16_unroll4(void) {
        return &_oil_function_impl_scalarmult_s16_unroll4;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u16_unroll4(void) {
        return &_oil_function_impl_scalarmult_u16_unroll4;
}

OilFunctionImpl* __oil_function_impl_scalarmult_s32_unroll4(void) {
        return &_oil_function_impl_scalarmult_s32_unroll4;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u32_unroll4(void) {
        return &_oil_function_impl_scalarmult_u32_unroll4;
}

OilFunctionImpl* __oil_function_impl_scalarmult_f32_unroll4(void) {
        return &_oil_function_impl_scalarmult_f32_unroll4;
}

OilFunctionImpl* __oil_function_impl_scalarmult_f64_unroll4(void) {
        return &_oil_function_impl_scalarmult_f64_unroll4;
}

#endif /* __SYMBIAN32__ */
sl@0
   302
sl@0
   303
#ifdef __SYMBIAN32__

/*
 * Accessor functions for the scalarmult_<type>_unroll2x implementations.
 *
 * Each function returns the address of the correspondingly named
 * _oil_function_impl_scalarmult_<type>_unroll2x object (presumably the
 * descriptor emitted by OIL_DEFINE_IMPL in SCALARMULT_DEFINE_UNROLL2x --
 * confirm against liboilfunction.h).  They are compiled only when
 * __SYMBIAN32__ is defined.
 *
 * The parameter lists are spelled (void) so the definitions are proper
 * prototypes rather than old-style unprototyped declarators.
 */
OilFunctionImpl* __oil_function_impl_scalarmult_s8_unroll2x(void) {
        return &_oil_function_impl_scalarmult_s8_unroll2x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u8_unroll2x(void) {
        return &_oil_function_impl_scalarmult_u8_unroll2x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_s16_unroll2x(void) {
        return &_oil_function_impl_scalarmult_s16_unroll2x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u16_unroll2x(void) {
        return &_oil_function_impl_scalarmult_u16_unroll2x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_s32_unroll2x(void) {
        return &_oil_function_impl_scalarmult_s32_unroll2x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u32_unroll2x(void) {
        return &_oil_function_impl_scalarmult_u32_unroll2x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_f32_unroll2x(void) {
        return &_oil_function_impl_scalarmult_f32_unroll2x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_f64_unroll2x(void) {
        return &_oil_function_impl_scalarmult_f64_unroll2x;
}

#endif /* __SYMBIAN32__ */
sl@0
   358
sl@0
   359
#ifdef __SYMBIAN32__

/*
 * Accessor functions for the scalarmult_<type>_x implementations.
 *
 * Each function returns the address of the correspondingly named
 * _oil_function_impl_scalarmult_<type>_x object (presumably the
 * descriptor emitted by OIL_DEFINE_IMPL in SCALARMULT_DEFINE_X --
 * confirm against liboilfunction.h).  They are compiled only when
 * __SYMBIAN32__ is defined.
 *
 * The parameter lists are spelled (void) so the definitions are proper
 * prototypes rather than old-style unprototyped declarators.
 */
OilFunctionImpl* __oil_function_impl_scalarmult_s8_x(void) {
        return &_oil_function_impl_scalarmult_s8_x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u8_x(void) {
        return &_oil_function_impl_scalarmult_u8_x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_s16_x(void) {
        return &_oil_function_impl_scalarmult_s16_x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u16_x(void) {
        return &_oil_function_impl_scalarmult_u16_x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_s32_x(void) {
        return &_oil_function_impl_scalarmult_s32_x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_u32_x(void) {
        return &_oil_function_impl_scalarmult_u32_x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_f32_x(void) {
        return &_oil_function_impl_scalarmult_f32_x;
}

OilFunctionImpl* __oil_function_impl_scalarmult_f64_x(void) {
        return &_oil_function_impl_scalarmult_f64_x;
}

#endif /* __SYMBIAN32__ */