cuda:移除无用cpu代码

miaobyte · miaobyte · commit b722c0bca148 · 2025-03-07T21:43:36.000+08:00
diff --git a/excuter/op-mem-cuda/CMakeLists.txt b/excuter/op-mem-cuda/CMakeLists.txt
@@ -32,7 +32,8 @@ file(GLOB_RECURSE CLIENT_SOURCES "src/client/*.cpp")
 # include(FetchContent)
 
 find_package(CUDAToolkit REQUIRED COMPONENTS cublas)
-set(CUDA_TOOLKIT_ROOT_DIR /usr/local/cuda-12.6)  # 根据您的安装路径进行调整
+include_directories(${CUDAToolkit_INCLUDE_DIRS})
+
 set(CMAKE_CUDA_STANDARD 17)
 set(CMAKE_CUDA_ARCHITECTURES 61)  # 根据您的 GPU 计算能力进行调整
 set(CMAKE_CUDA_SEPARABLE_COMPILATION ON) #确保 CMake 能够正确识别 CUDA 文件并将其编译为目标
diff --git a/excuter/op-mem-cuda/src/deepx/tensorfunc/equal.hpp b/excuter/op-mem-cuda/src/deepx/tensorfunc/equal.hpp
@@ -1,8 +1,7 @@
 #ifndef DEEPX_TENSORFUNC_EQUAL_HPP
 #define DEEPX_TENSORFUNC_EQUAL_HPP
 #include <cmath>
-#include <omp.h>
-
+ 
 #include "deepx/tensor.hpp"
 #include "deepx/shape.hpp"
 namespace deepx::tensorfunc
diff --git a/excuter/op-mem-cuda/src/deepx/tensorfunc/matmul.hpp b/excuter/op-mem-cuda/src/deepx/tensorfunc/matmul.hpp
@@ -1,7 +1,6 @@
 #ifndef DEEPX_TENSORFUNC_MATMUL_HPP
 #define DEEPX_TENSORFUNC_MATMUL_HPP
-
-#include <cblas.h> // 如果使用 OpenBLAS
+ 
 #include "deepx/tensor.hpp"
 
 namespace deepx::tensorfunc
diff --git a/excuter/op-mem-cuda/src/deepx/tensorfunc/reduce.hpp b/excuter/op-mem-cuda/src/deepx/tensorfunc/reduce.hpp
@@ -5,7 +5,6 @@
 #include <algorithm>
 #include <stdexcept>
 #include <deepx/vector_combination.hpp>
-#include <hwy/highway.h>
  
 #include "deepx/tensor.hpp"
 #include "deepx/shape_reduce.hpp"