12345678910111213141516171819202122232425262728293031323334353637383940414243444546 |
- #include <cmath>
- #include <memory>
- #include <stdexcept>
- #include <hip/hip_fp16.h>
- #include <hip/hip_runtime.h>
- #include <math.h>
- namespace {
- template <class T, class F>
- __global__ void global_entry_point(F f, T* out)
- {
- *out = f();
- }
- template <class T, class F>
- bool verify(F f, T expected)
- {
- std::unique_ptr<T> cpu_T(new T);
- T* gpu_T = nullptr;
- if (hipMalloc((void**)&gpu_T, sizeof(T)) != hipSuccess) {
- return false;
- }
- bool result = true;
- hipLaunchKernelGGL(global_entry_point, 1, 1, 0, 0, f, gpu_T);
- result = hipMemcpy(cpu_T.get(), gpu_T, sizeof(T), hipMemcpyDeviceToHost) ==
- hipSuccess &&
- result;
- result = hipFree(gpu_T) == hipSuccess && result;
- result = *cpu_T == expected && result;
- return result;
- }
- }
- int main(int argc, char** argv)
- {
- bool valid = verify([] __device__() { return std::round(1.4f); }, 1.0f);
- valid &= verify([] __device__() { return max<_Float16>(1.0f, 2.0f); }, 2.0f);
- valid &= verify([] __device__() { return min<_Float16>(1.0f, 2.0f); }, 1.0f);
- if (valid) {
- return 0;
- } else {
- return 1;
- }
- }
|