[Libclc-dev] [PATCH 02/15] Implement half_rsqrt builtin v2
Jan Vesely
jan.vesely at rutgers.edu
Fri Apr 10 16:22:07 PDT 2015
On Tue, 2015-04-07 at 18:05 +0000, Tom Stellard wrote:
> This is a generic implementation which just calls rsqrt.
> Targets should override this if they want a faster implementation.
>
> v2:
> - Alphabetize SOURCES
> ---
> generic/include/clc/clc.h | 1 +
> generic/include/clc/math/half_rsqrt.h | 31 +++++++++++++++++++++++++++++++
> generic/lib/SOURCES | 1 +
> generic/lib/math/half_rsqrt.cl | 30 ++++++++++++++++++++++++++++++
> generic/lib/math/half_rsqrt.inc | 25 +++++++++++++++++++++++++
> 5 files changed, 88 insertions(+)
> create mode 100644 generic/include/clc/math/half_rsqrt.h
> create mode 100644 generic/lib/math/half_rsqrt.cl
> create mode 100644 generic/lib/math/half_rsqrt.inc
>
> diff --git a/generic/include/clc/clc.h b/generic/include/clc/clc.h
> index 193c42b..b5ecda3 100644
> --- a/generic/include/clc/clc.h
> +++ b/generic/include/clc/clc.h
> @@ -56,6 +56,7 @@
> #include <clc/math/fmax.h>
> #include <clc/math/fmin.h>
> #include <clc/math/fmod.h>
> +#include <clc/math/half_rsqrt.h>
> #include <clc/math/half_sqrt.h>
> #include <clc/math/hypot.h>
> #include <clc/math/log.h>
> diff --git a/generic/include/clc/math/half_rsqrt.h b/generic/include/clc/math/half_rsqrt.h
> new file mode 100644
> index 0000000..e367d82
> --- /dev/null
> +++ b/generic/include/clc/math/half_rsqrt.h
> @@ -0,0 +1,31 @@
> +/*
> + * Copyright (c) 2014,2015 Advanced Micro Devices, Inc.
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a copy
> + * of this software and associated documentation files (the "Software"), to deal
> + * in the Software without restriction, including without limitation the rights
> + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
> + * copies of the Software, and to permit persons to whom the Software is
> + * furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice shall be included in
> + * all copies or substantial portions of the Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
> + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
> + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
> + * THE SOFTWARE.
> + */
> +
> +#undef half_rsqrt
> +
> +#define __CLC_BODY <clc/math/unary_decl.inc>
> +#define __CLC_FUNCTION half_rsqrt
> +
> +#include <clc/math/gentype.inc>
> +
> +#undef __CLC_BODY
> +#undef __CLC_FUNCTION
> diff --git a/generic/lib/SOURCES b/generic/lib/SOURCES
> index b360278..92067ea 100644
> --- a/generic/lib/SOURCES
> +++ b/generic/lib/SOURCES
> @@ -79,6 +79,7 @@ math/exp10.cl
> math/fmax.cl
> math/fmin.cl
> math/fmod.cl
> +math/half_rsqrt.cl
> math/half_sqrt.cl
> math/hypot.cl
> math/log10.cl
> diff --git a/generic/lib/math/half_rsqrt.cl b/generic/lib/math/half_rsqrt.cl
> new file mode 100644
> index 0000000..85695b0
> --- /dev/null
> +++ b/generic/lib/math/half_rsqrt.cl
> @@ -0,0 +1,30 @@
> +/*
> + * Copyright (c) 2014,2015 Advanced Micro Devices, Inc.
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a copy
> + * of this software and associated documentation files (the "Software"), to deal
> + * in the Software without restriction, including without limitation the rights
> + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
> + * copies of the Software, and to permit persons to whom the Software is
> + * furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice shall be included in
> + * all copies or substantial portions of the Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
> + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
> + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
> + * THE SOFTWARE.
> + */
> +
> +#include <clc/clc.h>
> +
> +#ifdef cl_khr_fp64
> +#pragma OPENCL EXTENSION cl_khr_fp64 : enable
> +#endif
Do we need the above? I know we use it for half_sqrt too, but the spec
only mentions floatN as the gentype allowed for half_ functions (table 6.9).
jan
> +
> +#define __CLC_BODY <half_rsqrt.inc>
> +#include <clc/math/gentype.inc>
> diff --git a/generic/lib/math/half_rsqrt.inc b/generic/lib/math/half_rsqrt.inc
> new file mode 100644
> index 0000000..33ce6c2
> --- /dev/null
> +++ b/generic/lib/math/half_rsqrt.inc
> @@ -0,0 +1,25 @@
> +/*
> + * Copyright (c) 2014,2015 Advanced Micro Devices, Inc.
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a copy
> + * of this software and associated documentation files (the "Software"), to deal
> + * in the Software without restriction, including without limitation the rights
> + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
> + * copies of the Software, and to permit persons to whom the Software is
> + * furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice shall be included in
> + * all copies or substantial portions of the Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
> + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
> + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
> + * THE SOFTWARE.
> + */
> +
> +_CLC_OVERLOAD _CLC_DEF __CLC_GENTYPE half_rsqrt(__CLC_GENTYPE val) {
> + return rsqrt(val);
> +}
--
Jan Vesely <jan.vesely at rutgers.edu>
-------------- next part --------------
A non-text attachment was scrubbed...
Name: signature.asc
Type: application/pgp-signature
Size: 819 bytes
Desc: This is a digitally signed message part
URL: <http://lists.llvm.org/pipermail/libclc-dev/attachments/20150410/310057d6/attachment.sig>
More information about the Libclc-dev
mailing list