aboutsummaryrefslogtreecommitdiff
path: root/src/builtins/sincos.cl
blob: 1552f6b32c6d5b8401c303927bd31d088eebce19 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
/******************************************************************************
 * Copyright (c) 2011-2014, Texas Instruments Incorporated - http://www.ti.com/
 *   All rights reserved.
 *
 *   Redistribution and use in source and binary forms, with or without
 *   modification, are permitted provided that the following conditions are met:
 *       * Redistributions of source code must retain the above copyright
 *         notice, this list of conditions and the following disclaimer.
 *       * Redistributions in binary form must reproduce the above copyright
 *         notice, this list of conditions and the following disclaimer in the
 *         documentation and/or other materials provided with the distribution.
 *       * Neither the name of Texas Instruments Incorporated nor the
 *         names of its contributors may be used to endorse or promote products
 *         derived from this software without specific prior written permission.
 *
 *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 *   AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 *   IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 
 *   ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 *   LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 *   CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 *   SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 *   INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 *   CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 *   ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
 *   THE POSSIBILITY OF SUCH DAMAGE.
 *****************************************************************************/
#include "clc.h"

_CLC_PROTECTED void sincosf(float x, float * sinval, float * cosval);
_CLC_PROTECTED void builtin_sincos(double x, double * sinval, double * cosval);

#define SINCOS_SCALAR_BODY(type, op) \
{ \
    type sin_val; \
    type cos_val; \
    op(x, &sin_val, &cos_val); \
    *cosval = cos_val; \
    return sin_val; \
} \

#define SINCOS_VECTOR_BODY_2(prim_type, op) \
    op(x.s0, &(((prim_type*)&sin_val)[0]), &(((prim_type*)&cos_val)[0])); \
    op(x.s1, &(((prim_type*)&sin_val)[1]), &(((prim_type*)&cos_val)[1])); \

#define SINCOS_VECTOR_BODY_3(prim_type, op) \
    SINCOS_VECTOR_BODY_2(prim_type, op) \
    op(x.s2, &(((prim_type*)&sin_val)[2]), &(((prim_type*)&cos_val)[2])); \

#define SINCOS_VECTOR_BODY_4(prim_type, op) \
    SINCOS_VECTOR_BODY_3(prim_type, op) \
    op(x.s3, &(((prim_type*)&sin_val)[3]), &(((prim_type*)&cos_val)[3])); \

#define SINCOS_VECTOR_BODY_8(prim_type, op) \
    SINCOS_VECTOR_BODY_4(prim_type, op) \
    op(x.s4, &(((prim_type*)&sin_val)[4]), &(((prim_type*)&cos_val)[4])); \
    op(x.s5, &(((prim_type*)&sin_val)[5]), &(((prim_type*)&cos_val)[5])); \
    op(x.s6, &(((prim_type*)&sin_val)[6]), &(((prim_type*)&cos_val)[6])); \
    op(x.s7, &(((prim_type*)&sin_val)[7]), &(((prim_type*)&cos_val)[7])); \

#define SINCOS_VECTOR_BODY_16(prim_type, op) \
    SINCOS_VECTOR_BODY_8(prim_type, op) \
    op(x.s8, &(((prim_type*)&sin_val)[8]), &(((prim_type*)&cos_val)[8])); \
    op(x.s9, &(((prim_type*)&sin_val)[9]), &(((prim_type*)&cos_val)[9])); \
    op(x.sa, &(((prim_type*)&sin_val)[10]), &(((prim_type*)&cos_val)[10])); \
    op(x.sb, &(((prim_type*)&sin_val)[11]), &(((prim_type*)&cos_val)[11])); \
    op(x.sc, &(((prim_type*)&sin_val)[12]), &(((prim_type*)&cos_val)[12])); \
    op(x.sd, &(((prim_type*)&sin_val)[13]), &(((prim_type*)&cos_val)[13])); \
    op(x.se, &(((prim_type*)&sin_val)[14]), &(((prim_type*)&cos_val)[14])); \
    op(x.sf, &(((prim_type*)&sin_val)[15]), &(((prim_type*)&cos_val)[15])); \

#define SINCOS_VECTOR_BODY(prim_type, num, op) \
{ \
    prim_type##num   sin_val; \
    prim_type##num   cos_val; \
    SINCOS_VECTOR_BODY_##num(prim_type, op)\
    *cosval =  cos_val; \
    return sin_val; \
} \

_CLC_OVERLOAD _CLC_INLINE float sincos(float x, global  float * cosval) SINCOS_SCALAR_BODY(float, sincosf)
_CLC_OVERLOAD _CLC_INLINE float sincos(float x, local   float * cosval) SINCOS_SCALAR_BODY(float, sincosf)
_CLC_OVERLOAD _CLC_INLINE float sincos(float x, private float * cosval) SINCOS_SCALAR_BODY(float, sincosf)

_CLC_OVERLOAD _CLC_DEF float2 sincos(float2 x, global  float2 * cosval) SINCOS_VECTOR_BODY(float, 2, sincosf)
_CLC_OVERLOAD _CLC_DEF float2 sincos(float2 x, local   float2 * cosval) SINCOS_VECTOR_BODY(float, 2, sincosf)
_CLC_OVERLOAD _CLC_DEF float2 sincos(float2 x, private float2 * cosval) SINCOS_VECTOR_BODY(float, 2, sincosf)

_CLC_OVERLOAD _CLC_DEF float3 sincos(float3 x, global  float3 * cosval) SINCOS_VECTOR_BODY(float, 3, sincosf)
_CLC_OVERLOAD _CLC_DEF float3 sincos(float3 x, local   float3 * cosval) SINCOS_VECTOR_BODY(float, 3, sincosf)
_CLC_OVERLOAD _CLC_DEF float3 sincos(float3 x, private float3 * cosval) SINCOS_VECTOR_BODY(float, 3, sincosf)

_CLC_OVERLOAD _CLC_DEF float4 sincos(float4 x, global  float4 * cosval) SINCOS_VECTOR_BODY(float, 4, sincosf)
_CLC_OVERLOAD _CLC_DEF float4 sincos(float4 x, local   float4 * cosval) SINCOS_VECTOR_BODY(float, 4, sincosf)
_CLC_OVERLOAD _CLC_DEF float4 sincos(float4 x, private float4 * cosval) SINCOS_VECTOR_BODY(float, 4, sincosf)

_CLC_OVERLOAD _CLC_DEF float8 sincos(float8 x, global  float8 * cosval) SINCOS_VECTOR_BODY(float, 8, sincosf)
_CLC_OVERLOAD _CLC_DEF float8 sincos(float8 x, local   float8 * cosval) SINCOS_VECTOR_BODY(float, 8, sincosf)
_CLC_OVERLOAD _CLC_DEF float8 sincos(float8 x, private float8 * cosval) SINCOS_VECTOR_BODY(float, 8, sincosf)

_CLC_OVERLOAD _CLC_DEF float16 sincos(float16 x, global  float16 * cosval) SINCOS_VECTOR_BODY(float, 16, sincosf)
_CLC_OVERLOAD _CLC_DEF float16 sincos(float16 x, local   float16 * cosval) SINCOS_VECTOR_BODY(float, 16, sincosf)
_CLC_OVERLOAD _CLC_DEF float16 sincos(float16 x, private float16 * cosval) SINCOS_VECTOR_BODY(float, 16, sincosf)

_CLC_OVERLOAD _CLC_DEF double sincos(double x, global  double * cosval) SINCOS_SCALAR_BODY(double, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double sincos(double x, local   double * cosval) SINCOS_SCALAR_BODY(double, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double sincos(double x, private double * cosval) SINCOS_SCALAR_BODY(double, builtin_sincos)

_CLC_OVERLOAD _CLC_DEF double2 sincos(double2 x, global  double2 * cosval) SINCOS_VECTOR_BODY(double, 2, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double2 sincos(double2 x, local   double2 * cosval) SINCOS_VECTOR_BODY(double, 2, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double2 sincos(double2 x, private double2 * cosval) SINCOS_VECTOR_BODY(double, 2, builtin_sincos)

_CLC_OVERLOAD _CLC_DEF double3 sincos(double3 x, global  double3 * cosval) SINCOS_VECTOR_BODY(double, 3, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double3 sincos(double3 x, local   double3 * cosval) SINCOS_VECTOR_BODY(double, 3, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double3 sincos(double3 x, private double3 * cosval) SINCOS_VECTOR_BODY(double, 3, builtin_sincos)

_CLC_OVERLOAD _CLC_DEF double4 sincos(double4 x, global  double4 * cosval) SINCOS_VECTOR_BODY(double, 4, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double4 sincos(double4 x, local   double4 * cosval) SINCOS_VECTOR_BODY(double, 4, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double4 sincos(double4 x, private double4 * cosval) SINCOS_VECTOR_BODY(double, 4, builtin_sincos)

_CLC_OVERLOAD _CLC_DEF double8 sincos(double8 x, global  double8 * cosval) SINCOS_VECTOR_BODY(double, 8, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double8 sincos(double8 x, local   double8 * cosval) SINCOS_VECTOR_BODY(double, 8, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double8 sincos(double8 x, private double8 * cosval) SINCOS_VECTOR_BODY(double, 8, builtin_sincos)

_CLC_OVERLOAD _CLC_DEF double16 sincos(double16 x, global  double16 * cosval) SINCOS_VECTOR_BODY(double, 16, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double16 sincos(double16 x, local   double16 * cosval) SINCOS_VECTOR_BODY(double, 16, builtin_sincos)
_CLC_OVERLOAD _CLC_DEF double16 sincos(double16 x, private double16 * cosval) SINCOS_VECTOR_BODY(double, 16, builtin_sincos)