[Libclc-dev] [PATCH 02/15] Implement half_rsqrt builtin v2

Jan Vesely jan.vesely at rutgers.edu
Fri Apr 10 16:22:07 PDT 2015


On Tue, 2015-04-07 at 18:05 +0000, Tom Stellard wrote:
> This is a generic implementation which just calls rsqrt.
> Targets should override this if they want a faster implementation.
> 
> v2:
>   - Alphabetize SOURCES
> ---
>  generic/include/clc/clc.h             |  1 +
>  generic/include/clc/math/half_rsqrt.h | 31 +++++++++++++++++++++++++++++++
>  generic/lib/SOURCES                   |  1 +
>  generic/lib/math/half_rsqrt.cl        | 30 ++++++++++++++++++++++++++++++
>  generic/lib/math/half_rsqrt.inc       | 25 +++++++++++++++++++++++++
>  5 files changed, 88 insertions(+)
>  create mode 100644 generic/include/clc/math/half_rsqrt.h
>  create mode 100644 generic/lib/math/half_rsqrt.cl
>  create mode 100644 generic/lib/math/half_rsqrt.inc
> 
> diff --git a/generic/include/clc/clc.h b/generic/include/clc/clc.h
> index 193c42b..b5ecda3 100644
> --- a/generic/include/clc/clc.h
> +++ b/generic/include/clc/clc.h
> @@ -56,6 +56,7 @@
>  #include <clc/math/fmax.h>
>  #include <clc/math/fmin.h>
>  #include <clc/math/fmod.h>
> +#include <clc/math/half_rsqrt.h>
>  #include <clc/math/half_sqrt.h>
>  #include <clc/math/hypot.h>
>  #include <clc/math/log.h>
> diff --git a/generic/include/clc/math/half_rsqrt.h b/generic/include/clc/math/half_rsqrt.h
> new file mode 100644
> index 0000000..e367d82
> --- /dev/null
> +++ b/generic/include/clc/math/half_rsqrt.h
> @@ -0,0 +1,31 @@
> +/*
> + * Copyright (c) 2014,2015 Advanced Micro Devices, Inc.
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a copy
> + * of this software and associated documentation files (the "Software"), to deal
> + * in the Software without restriction, including without limitation the rights
> + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
> + * copies of the Software, and to permit persons to whom the Software is
> + * furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice shall be included in
> + * all copies or substantial portions of the Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
> + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
> + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
> + * THE SOFTWARE.
> + */
> +
> +#undef half_rsqrt
> +
> +#define __CLC_BODY <clc/math/unary_decl.inc>
> +#define __CLC_FUNCTION half_rsqrt
> +
> +#include <clc/math/gentype.inc>
> +
> +#undef __CLC_BODY
> +#undef __CLC_FUNCTION
> diff --git a/generic/lib/SOURCES b/generic/lib/SOURCES
> index b360278..92067ea 100644
> --- a/generic/lib/SOURCES
> +++ b/generic/lib/SOURCES
> @@ -79,6 +79,7 @@ math/exp10.cl
>  math/fmax.cl
>  math/fmin.cl
>  math/fmod.cl
> +math/half_rsqrt.cl
>  math/half_sqrt.cl
>  math/hypot.cl
>  math/log10.cl
> diff --git a/generic/lib/math/half_rsqrt.cl b/generic/lib/math/half_rsqrt.cl
> new file mode 100644
> index 0000000..85695b0
> --- /dev/null
> +++ b/generic/lib/math/half_rsqrt.cl
> @@ -0,0 +1,30 @@
> +/*
> + * Copyright (c) 2014,2015 Advanced Micro Devices, Inc.
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a copy
> + * of this software and associated documentation files (the "Software"), to deal
> + * in the Software without restriction, including without limitation the rights
> + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
> + * copies of the Software, and to permit persons to whom the Software is
> + * furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice shall be included in
> + * all copies or substantial portions of the Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
> + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
> + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
> + * THE SOFTWARE.
> + */
> +
> +#include <clc/clc.h>
> +
> +#ifdef cl_khr_fp64
> +#pragma OPENCL EXTENSION cl_khr_fp64 : enable
> +#endif

Do we need the above? I know we use it for half_sqrt too, but the spec
only mentions floatN as the gentype allowed for half_ functions (table 6.9).

jan

> +
> +#define __CLC_BODY <half_rsqrt.inc>
> +#include <clc/math/gentype.inc>
> diff --git a/generic/lib/math/half_rsqrt.inc b/generic/lib/math/half_rsqrt.inc
> new file mode 100644
> index 0000000..33ce6c2
> --- /dev/null
> +++ b/generic/lib/math/half_rsqrt.inc
> @@ -0,0 +1,25 @@
> +/*
> + * Copyright (c) 2014,2015 Advanced Micro Devices, Inc.
> + *
> + * Permission is hereby granted, free of charge, to any person obtaining a copy
> + * of this software and associated documentation files (the "Software"), to deal
> + * in the Software without restriction, including without limitation the rights
> + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
> + * copies of the Software, and to permit persons to whom the Software is
> + * furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice shall be included in
> + * all copies or substantial portions of the Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
> + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
> + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
> + * THE SOFTWARE.
> + */
> +
> +_CLC_OVERLOAD _CLC_DEF __CLC_GENTYPE half_rsqrt(__CLC_GENTYPE val) {
> +  return rsqrt(val);
> +}

-- 
Jan Vesely <jan.vesely at rutgers.edu>
-------------- next part --------------
A non-text attachment was scrubbed...
Name: signature.asc
Type: application/pgp-signature
Size: 819 bytes
Desc: This is a digitally signed message part
URL: <http://lists.llvm.org/pipermail/libclc-dev/attachments/20150410/310057d6/attachment.sig>


More information about the Libclc-dev mailing list