[libc-commits] [PATCH] D153388: [libc] Add basic utility support for timing functions on the GPU
Joseph Huber via Phabricator via libc-commits
libc-commits at lists.llvm.org
Tue Jun 20 19:14:32 PDT 2023
jhuber6 updated this revision to Diff 533103.
jhuber6 added a comment.
-> LIBC_HAS_BUILTIN
Repository:
rG LLVM Github Monorepo
CHANGES SINCE LAST ACTION
https://reviews.llvm.org/D153388/new/
https://reviews.llvm.org/D153388
Files:
libc/src/__support/GPU/amdgpu/utils.h
libc/src/__support/GPU/generic/utils.h
libc/src/__support/GPU/nvptx/utils.h
Index: libc/src/__support/GPU/nvptx/utils.h
===================================================================
--- libc/src/__support/GPU/nvptx/utils.h
+++ libc/src/__support/GPU/nvptx/utils.h
@@ -134,6 +134,20 @@
__nvvm_bar_warp_sync(mask);
}
+/// Reads the GPU's processor clock and returns its current value.
+LIBC_INLINE uint64_t clock() {
+ uint64_t cycles;
+ // Copy the 64-bit `%clock64` special register into a 64-bit register operand.
+ asm volatile("mov.u64 %0, %%clock64;" : "=l"(cycles));
+ return cycles;
+}
+
+/// Reads the global fixed-frequency timer, which counts in nanoseconds.
+LIBC_INLINE uint64_t time() {
+ uint64_t nanoseconds;
+ // Copy the 64-bit `%globaltimer` special register into the result.
+ asm volatile("mov.u64 %0, %%globaltimer;" : "=l"(nanoseconds));
+ return nanoseconds;
+}
+
} // namespace gpu
} // namespace __llvm_libc
Index: libc/src/__support/GPU/generic/utils.h
===================================================================
--- libc/src/__support/GPU/generic/utils.h
+++ libc/src/__support/GPU/generic/utils.h
@@ -67,6 +67,10 @@
LIBC_INLINE void sync_lane(uint64_t) {}
+/// Generic fallback: no processor clock is read here, so this always yields 0.
+LIBC_INLINE uint64_t clock() {
+ return 0;
+}
+
+/// Generic fallback: no timer is read here, so this always yields 0.
+LIBC_INLINE uint64_t time() {
+ return 0;
+}
+
} // namespace gpu
} // namespace __llvm_libc
Index: libc/src/__support/GPU/amdgpu/utils.h
===================================================================
--- libc/src/__support/GPU/amdgpu/utils.h
+++ libc/src/__support/GPU/amdgpu/utils.h
@@ -10,6 +10,7 @@
#define LLVM_LIBC_SRC_SUPPORT_GPU_AMDGPU_IO_H
#include "src/__support/common.h"
+#include "src/__support/macros/config.h"
#include <stdint.h>
@@ -144,6 +145,21 @@
__builtin_amdgcn_wave_barrier();
}
+/// Reads the GPU's processor clock and returns its current value.
+/// NOTE: On the RDNA3 architecture this was replaced by a cycle counter that
+/// is only 20 bits wide.
+LIBC_INLINE uint64_t clock() {
+ const uint64_t cycles = __builtin_readcyclecounter();
+ return cycles;
+}
+
+/// Returns a fixed-frequency timestamp from the first available timer builtin.
+/// The frequency depends on the card and can only be queried via the driver.
+LIBC_INLINE uint64_t time() {
+ if constexpr (LIBC_HAS_BUILTIN(__builtin_amdgcn_s_sendmsg_rtnl))
+ return __builtin_amdgcn_s_sendmsg_rtnl(0x83); // NOTE(review): 0x83 is presumably the MSG_RTN_GET_REALTIME message ID; confirm
+ else if constexpr (LIBC_HAS_BUILTIN(__builtin_amdgcn_s_memrealtime))
+ return __builtin_amdgcn_s_memrealtime(); // second choice when the sendmsg builtin is unavailable
+ else
+ return __builtin_amdgcn_s_memtime(); // used when neither builtin above is reported available
+}
+
} // namespace gpu
} // namespace __llvm_libc
-------------- next part --------------
A non-text attachment was scrubbed...
Name: D153388.533103.patch
Type: text/x-patch
Size: 2258 bytes
Desc: not available
URL: <http://lists.llvm.org/pipermail/libc-commits/attachments/20230621/b9b8ae32/attachment.bin>
More information about the libc-commits
mailing list