Skip to content

Commit 2a25780

Browse files
committed
fix build
1 parent 3d507bd commit 2a25780

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

onnxruntime/contrib_ops/cuda/bert/group_query_attention_impl.cu

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -50,7 +50,6 @@ limitations under the License.
 50  50    #include "contrib_ops/cuda/utils/dump_cuda_tensor.h"
 51  51    #include "core/providers/cuda/cu_inc/common.cuh"
 52  52    #include "core/providers/cuda/cuda_type_conversion.h"
 53      -
 54  53    #include "core/providers/cuda/shared_inc/cuda_call.h"
 55  54    #include "core/providers/cuda/shared_inc/fpgeneric.h"
 56  55

onnxruntime/contrib_ops/cuda/bert/group_query_attention_qkv.cuh

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -12,6 +12,7 @@
 12  12    #include "contrib_ops/cpu/bert/attention_common.h"
 13  13    #include "contrib_ops/cuda/bert/rotary_common.cuh"
 14  14    #include "core/providers/cuda/cuda_common.h"
     15  + #include "core/providers/cuda/cuda_type_conversion.h"
 15  16    #include "core/providers/cuda/shared_inc/cuda_call.h"
 16  17
 17  18    using namespace onnxruntime::cuda;
@@ -304,8 +305,8 @@ Status LaunchUnpackRoPEAppend(
304 305    const int rotary_dim, const int64_t* position_ids, const bool interleaved,
305 306    const bool is_cache_bnsh, const KVQuantizationType k_quant_type,
306 307    cudaStream_t stream, const int max_threads_per_block) {
307     -  static_assert(std::is_same<T, typename OrtToCudaType<T>::type>::value);
308     -  static_assert(std::is_same<U, typename OrtToCudaType<U>::type>::value);
    308 +  static_assert(std::is_same<T, typename onnxruntime::cuda::OrtToCudaType<T>::type>::value);
    309 +  static_assert(std::is_same<U, typename onnxruntime::cuda::OrtToCudaType<U>::type>::value);
309 310
310 311    constexpr int elements_per_vector = sizeof(float4) / sizeof(T);
311 312

0 commit comments

Comments
 (0)