File tree Expand file tree Collapse file tree 2 files changed +2
-4
lines changed
onnxruntime/core/providers/cuda/llm Expand file tree Collapse file tree 2 files changed +2
-4
lines changed Original file line number Diff line number Diff line change 44#include " core/providers/cuda/cuda_common.h"
55#include " core/providers/cpu/llm/attention_helper.h"
66#include " core/providers/cuda/llm/attention.h"
7- #include " core/providers/cuda/llm/attention_naive.h"
87#include " contrib_ops/cuda/bert/attention_data.h"
98#include " contrib_ops/cuda/bert/attention_impl.h"
109
Original file line number Diff line number Diff line change @@ -9,10 +9,9 @@ namespace onnxruntime {
99namespace cuda {
1010
1111using namespace onnxruntime ::cuda;
12- 1Code has alerts.Press enter to view.
1312
14- template <typename T>
15- class Attention final : public CudaKernel {
13+ template <typename T>
14+ class Attention final : public CudaKernel {
1615 public:
1716 Attention (const OpKernelInfo& info);
1817 Status ComputeInternal (OpKernelContext* context) const override ;
You can’t perform that action at this time.
0 commit comments