3#include <cuda_runtime.h>
17 FP8Format format_a = FP8Format::e4m3;
18 FP8Format format_b = FP8Format::e4m3;
// Hopper-architecture predicate: takes no arguments and returns a bool.
// NOTE(review): presumably queries the active device's compute capability
// (Hopper is SM90) so callers can choose between the FP8 path and the
// fallback — the definition is not visible from this header; confirm there.
24bool is_hopper_architecture();
// FP8 GEMM entry point (declaration only; the definition lives elsewhere).
//
// Parameters visible in this declaration:
//   A, B   - pointers to const __half; read-only operands.
//   C      - pointer to non-const __half; presumably the output matrix.
//   config - FP8GEMMConfig taken by const reference.
//   stream - CUDA stream for the call; defaults to nullptr, i.e. the
//            default stream.
//
// NOTE(review): the operands are typed __half although the function name says
// FP8 — presumably conversion to the FP8 formats selected in `config` happens
// internally; confirm against the implementation.
// NOTE(review): A/B/C are presumably device pointers, and whether the call is
// asynchronous with respect to the host is not stated here — TODO confirm.
26void fp8_gemm(const __half* A, const __half* B, __half* C,
28 const FP8GEMMConfig& config,
29 cudaStream_t stream = nullptr);
// Fallback GEMM entry point (declaration only; the definition lives
// elsewhere).
//
// Parameters visible in this declaration:
//   A, B   - pointers to const __half; read-only operands.
//   C      - pointer to non-const __half; presumably the output matrix.
//   config - FP8GEMMConfig taken by const reference.
//   stream - CUDA stream for the call; defaults to nullptr, i.e. the
//            default stream.
//
// NOTE(review): presumably the path used when native FP8 support is
// unavailable (e.g. on pre-Hopper GPUs) — the selection logic is not visible
// in this header; confirm against the implementation.
// NOTE(review): A/B/C are presumably device pointers — TODO confirm.
31void fp8_gemm_fallback(const __half* A, const __half* B, __half* C,
33 const FP8GEMMConfig& config,
34 cudaStream_t stream = nullptr);
36} // namespace hpc::cuda13