|
1 /* |
|
2 * LIBOIL - Library of Optimized Inner Loops |
|
3 * Copyright (c) 2003,2004 David A. Schleef <ds@schleef.org> |
|
4 * All rights reserved. |
|
5 * |
|
6 * Redistribution and use in source and binary forms, with or without |
|
7 * modification, are permitted provided that the following conditions |
|
8 * are met: |
|
9 * 1. Redistributions of source code must retain the above copyright |
|
10 * notice, this list of conditions and the following disclaimer. |
|
11 * 2. Redistributions in binary form must reproduce the above copyright |
|
12 * notice, this list of conditions and the following disclaimer in the |
|
13 * documentation and/or other materials provided with the distribution. |
|
14 * |
|
15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR |
|
16 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |
|
17 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
|
18 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, |
|
19 * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |
|
20 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR |
|
21 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) |
|
22 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, |
|
23 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING |
|
24 * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE |
|
25 * POSSIBILITY OF SUCH DAMAGE. |
|
26 */ |
|
27 //Portions Copyright (c) 2008-2009 Nokia Corporation and/or its subsidiary(-ies). All rights reserved. |
|
28 |
|
29 #ifdef HAVE_CONFIG_H |
|
30 #include "config.h" |
|
31 #endif |
|
32 |
|
33 #include <liboil/liboilfunction.h> |
|
34 #include "liboil/simdpack/simdpack.h" |
|
35 |
|
/* This is a surprisingly fast implementation of clipping
 * in straight C.  It would be difficult to do it faster in asm
 * without specialized opcodes. */
|
39 |
|
40 static void |
|
41 clip_s16_fast (int16_t *dest, int dstr, int16_t *src, int sstr, int n, |
|
42 int16_t *low, int16_t *hi) |
|
43 { |
|
44 int i; |
|
45 int32_t x; |
|
46 |
|
47 for(i=0;i<n;i++){ |
|
48 x = OIL_GET(src,i*sstr, int16_t); |
|
49 x = x - (((x-*low)>>31)&(x-*low)) + (((*hi-x)>>31)&(*hi-x)); |
|
50 OIL_GET(dest,i*dstr, int16_t) = x; |
|
51 } |
|
52 } |
|
53 |
|
54 OIL_DEFINE_IMPL (clip_s16_fast, clip_s16); |
|
55 |
|
/*
 * clip_s16_fast2:
 * @dest: destination samples; advanced by @dstr after every store
 * @dstr: per-element offset applied to @dest via OIL_INCREMENT
 * @src:  source samples; advanced by @sstr after every load
 * @sstr: per-element offset applied to @src via OIL_INCREMENT
 * @n:    number of elements to process; nothing is touched when n <= 0
 * @low:  pointer to the lower clip bound
 * @hi:   pointer to the upper clip bound
 *
 * Two-at-a-time variant of the branch-free int16_t clip.  An odd element
 * count is handled by a single-element prologue, after which the main
 * loop consumes elements in pairs.  Each value is first raised to *low if
 * it is below it, then lowered to *hi if it is above it.
 *
 * NOTE: the masks rely on ">>" of a negative signed value being an
 * arithmetic shift, which is implementation-defined in C.
 * NOTE(review): the strides are presumably byte offsets, as is usual for
 * OIL_INCREMENT -- confirm against liboilfunction.h.
 */
static void
clip_s16_fast2 (int16_t *dest, int dstr, int16_t *src, int sstr, int n,
    int16_t *low, int16_t *hi)
{
  int32_t x1, x2;

  /* A negative odd count still has its low bit set, so without this guard
   * the odd-element prologue below would read and write one element even
   * though there is nothing to process. */
  if (n <= 0) {
    return;
  }

  /* Peel off one element so the main loop always sees an even count. */
  if (n & 1) {
    x1 = *src;
    OIL_INCREMENT (src, sstr);
    /* Raise to *low when below it ... */
    x1 -= (((x1 - *low) >> 31) & (x1 - *low));
    /* ... then lower to *hi when above it. */
    *dest = x1 + (((*hi - x1) >> 31) & (*hi - x1));
    OIL_INCREMENT (dest, dstr);
    n--;
  }

  while (n > 0) {
    /* Both loads happen before either store, as in the scalar prologue. */
    x1 = *src;
    OIL_INCREMENT (src, sstr);
    x2 = *src;
    OIL_INCREMENT (src, sstr);

    x1 -= (((x1 - *low) >> 31) & (x1 - *low));
    x2 -= (((x2 - *low) >> 31) & (x2 - *low));

    *dest = x1 + (((*hi - x1) >> 31) & (*hi - x1));
    OIL_INCREMENT (dest, dstr);
    *dest = x2 + (((*hi - x2) >> 31) & (*hi - x2));
    OIL_INCREMENT (dest, dstr);

    n -= 2;
  }
}
OIL_DEFINE_IMPL (clip_s16_fast2, clip_s16);
|
85 |
|
86 |
|
87 |
|
88 |
|
#if 0
/* broken */

/* Carried out with int32_t intermediates, this trick clips values in the
 * range min^(1<<31) to max^(1<<31) incorrectly, hence the int64_t
 * intermediate.  The implementation is disabled; it was marked broken
 * and the reason is not recorded here. */

static void
clip_s32_fast (int32_t *dest, int dstr, int32_t *src, int sstr, int n,
    int32_t *low, int32_t *hi)
{
  int idx;

  for (idx = 0; idx < n; idx++) {
    int64_t v = OIL_GET (src, idx * sstr, int32_t);
    int64_t under = v - *low;   /* negative when v is below the lower bound */
    int64_t over = *hi - v;     /* negative when v is above the upper bound */

    /* (d >> 63) is the sign mask of the 64-bit difference. */
    v = v - ((under >> 63) & under) + ((over >> 63) & over);
    OIL_GET (dest, idx * dstr, int32_t) = v;
  }
}

OIL_DEFINE_IMPL (clip_s32_fast, clip_s32);
#endif
|
112 |
|
113 |
|
114 |
|
115 |
|
#ifdef __SYMBIAN32__

/*
 * Symbian-only accessor: returns the address of the
 * _oil_function_impl_clip_s16_fast object.
 * NOTE(review): that object is presumably the one emitted by
 * OIL_DEFINE_IMPL (clip_s16_fast, clip_s16) -- confirm against the macro.
 *
 * Declared with (void) so the definition is a real prototype rather than
 * an obsolescent empty parameter list.
 */
OilFunctionImpl *
__oil_function_impl_clip_s16_fast (void)
{
  return &_oil_function_impl_clip_s16_fast;
}
#endif
|
122 |
|
#ifdef __SYMBIAN32__

/*
 * Symbian-only accessor: returns the address of the
 * _oil_function_impl_clip_s16_fast2 object.
 * NOTE(review): that object is presumably the one emitted by
 * OIL_DEFINE_IMPL (clip_s16_fast2, clip_s16) -- confirm against the macro.
 *
 * Declared with (void) so the definition is a real prototype rather than
 * an obsolescent empty parameter list.
 */
OilFunctionImpl *
__oil_function_impl_clip_s16_fast2 (void)
{
  return &_oil_function_impl_clip_s16_fast2;
}
#endif
|
#if 0
#ifdef __SYMBIAN32__

/*
 * Symbian-only accessor for the clip_s32_fast implementation record.
 * Kept disabled with "#if 0", like the clip_s32_fast implementation it
 * refers to.
 *
 * Declared with (void) so the definition is a real prototype rather than
 * an obsolescent empty parameter list.
 */
OilFunctionImpl *
__oil_function_impl_clip_s32_fast (void)
{
  return &_oil_function_impl_clip_s32_fast;
}
#endif
#endif