From f94f9e411f9a454263b6f0714fc85b8da5b150f3 Mon Sep 17 00:00:00 2001 From: Brian Li Date: Thu, 1 Jun 2023 19:56:27 +0800 Subject: [PATCH] Add missing headers --- .../kernels/decoder_masked_multihead_attention_utils.h | 1 + src/fastertransformer/utils/cublasMMWrapper.h | 1 + src/fastertransformer/utils/cuda_fp8_utils.cu | 3 +++ 3 files changed, 5 insertions(+) diff --git a/src/fastertransformer/kernels/decoder_masked_multihead_attention_utils.h b/src/fastertransformer/kernels/decoder_masked_multihead_attention_utils.h index 075e61b3c..e6a25fdc3 100644 --- a/src/fastertransformer/kernels/decoder_masked_multihead_attention_utils.h +++ b/src/fastertransformer/kernels/decoder_masked_multihead_attention_utils.h @@ -20,6 +20,7 @@ #include "src/fastertransformer/utils/cuda_fp8_utils.h" #include "src/fastertransformer/utils/cuda_type_utils.cuh" #include +#include using namespace fastertransformer; diff --git a/src/fastertransformer/utils/cublasMMWrapper.h b/src/fastertransformer/utils/cublasMMWrapper.h index 0c7ecbffa..c656f8098 100644 --- a/src/fastertransformer/utils/cublasMMWrapper.h +++ b/src/fastertransformer/utils/cublasMMWrapper.h @@ -20,6 +20,7 @@ #include #include #include +#include #include #include #include diff --git a/src/fastertransformer/utils/cuda_fp8_utils.cu b/src/fastertransformer/utils/cuda_fp8_utils.cu index f5e1d2465..618c5d8c0 100644 --- a/src/fastertransformer/utils/cuda_fp8_utils.cu +++ b/src/fastertransformer/utils/cuda_fp8_utils.cu @@ -16,6 +16,9 @@ #include "cuda_fp8_utils.h" +#include +#include + namespace fastertransformer { #ifdef ENABLE_FP8