genericopenlibs/liboil/src/i386/conv_sse.c
changeset 18 47c74d1534e1
equal deleted inserted replaced
0:e4d67989cc36 18:47c74d1534e1
       
     1 /*
       
     2  * LIBOIL - Library of Optimized Inner Loops
       
     3  * Copyright (c) 2003,2004 David A. Schleef <ds@schleef.org>
       
     4  * All rights reserved.
       
     5  *
       
     6  * Redistribution and use in source and binary forms, with or without
       
     7  * modification, are permitted provided that the following conditions
       
     8  * are met:
       
     9  * 1. Redistributions of source code must retain the above copyright
       
    10  *    notice, this list of conditions and the following disclaimer.
       
    11  * 2. Redistributions in binary form must reproduce the above copyright
       
    12  *    notice, this list of conditions and the following disclaimer in the
       
    13  *    documentation and/or other materials provided with the distribution.
       
    14  * 
       
    15  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
       
    16  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
       
    17  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
       
    18  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
       
    19  * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
       
    20  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
       
    21  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
       
    22  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
       
    23  * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
       
    24  * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
       
    25  * POSSIBILITY OF SUCH DAMAGE.
       
    26  */
       
    27 //Portions Copyright (c)  2008-2009 Nokia Corporation and/or its subsidiary(-ies). All rights reserved. 
       
    28 
       
    29 #ifdef HAVE_CONFIG_H
       
    30 #include "config.h"
       
    31 #endif
       
    32 #include <liboil/liboilfunction.h>
       
    33 #include <liboil/liboilclasses.h>
       
    34 
       
    35 
       
    36 /* suboptimal */
       
    37 static void conv_f64_s32_sse(double *dst, int dst_stride, int32_t *src, int src_stride, int n)
       
    38 {
       
    39 #if !defined(__WINSCW__) && !defined(__WINS__)      
       
    40 	int i;
       
    41 
       
    42 	for(i=0;i<n;i++){
       
    43 		asm volatile(
       
    44 			"	cvtsi2sd 0(%0), %%xmm0		\n"
       
    45 			"	movq %%xmm0, 0(%1)		\n"
       
    46 			:
       
    47 			: "a" (src), "c" (dst)
       
    48 			/* : "xmm0" */
       
    49 		);
       
    50 		dst = OIL_OFFSET(dst, dst_stride);
       
    51 		src = OIL_OFFSET(src, src_stride);
       
    52 	}
       
    53 #endif	
       
    54 }
       
    55 OIL_DEFINE_IMPL_FULL(conv_f64_s32_sse, conv_f64_s32, OIL_IMPL_FLAG_SSE2);
       
    56 
       
    57 /* suboptimal */
       
    58 static void conv_s32_f64_sse(int32_t *dst, int dst_stride, double *src, int src_stride, int n)
       
    59 {
       
    60 #if !defined(__WINSCW__) && !defined(__WINS__)      
       
    61 	int i;
       
    62 	int eax;
       
    63 
       
    64 	for(i=0;i<n;i++){
       
    65 		asm volatile(
       
    66 			"	cvtsd2si 0(%1), %0		\n"
       
    67 			: "=a" (eax)
       
    68 			: "c" (src)
       
    69 		);
       
    70 		*dst = eax;
       
    71 		dst = OIL_OFFSET(dst, dst_stride);
       
    72 		src = OIL_OFFSET(src, src_stride);
       
    73 	}
       
    74 #endif	
       
    75 }
       
    76 OIL_DEFINE_IMPL_FULL(conv_s32_f64_sse, conv_s32_f64, OIL_IMPL_FLAG_SSE2);
       
    77 
       
    78 /* suboptimal */
       
    79 static void conv_s32_f32_sse(int32_t *dst, int dst_stride, double *src, int src_stride, int n)
       
    80 {
       
    81 #if !defined(__WINSCW__) && !defined(__WINS__)      
       
    82 	int i;
       
    83 
       
    84 	for(i=0;i<n;i++){
       
    85 		asm volatile(
       
    86                     "  movd 0(%1), %%xmm0\n"
       
    87 		    "  cvtps2pi %%xmm0, %%mm0\n"
       
    88                     "  movd %%mm0, 0(%0)\n"
       
    89 			:
       
    90                         : "r" (dst), "r" (src)
       
    91 		);
       
    92 		dst = OIL_OFFSET(dst, dst_stride);
       
    93 		src = OIL_OFFSET(src, src_stride);
       
    94 	}
       
    95         asm volatile ("emms\n");
       
    96 #endif
       
    97 }
       
    98 OIL_DEFINE_IMPL_FULL(conv_s32_f32_sse, conv_s32_f32, OIL_IMPL_FLAG_SSE2 | OIL_IMPL_FLAG_MMX);
       
    99 
       
   100 
       
   101 
       
   102 #ifdef	__SYMBIAN32__
       
   103  
       
   104 OilFunctionImpl* __oil_function_impl_conv_f64_s32_sse, conv_f64_s32() {
       
   105 		return &_oil_function_impl_conv_f64_s32_sse, conv_f64_s32;
       
   106 }
       
   107 #endif
       
   108 
       
   109 #ifdef	__SYMBIAN32__
       
   110  
       
   111 OilFunctionImpl* __oil_function_impl_conv_s32_f64_sse, conv_s32_f64() {
       
   112 		return &_oil_function_impl_conv_s32_f64_sse, conv_s32_f64;
       
   113 }
       
   114 #endif
       
   115 
       
   116 #ifdef	__SYMBIAN32__
       
   117  
       
   118 OilFunctionImpl* __oil_function_impl_conv_s32_f32_sse, conv_s32_f32() {
       
   119 		return &_oil_function_impl_conv_s32_f32_sse, conv_s32_f32;
       
   120 }
       
   121 #endif
       
   122