From 5a3ea35606c306c318200e525588ee1e3a3adb55 Mon Sep 17 00:00:00 2001 From: "peng.li24" Date: Mon, 26 Jan 2026 03:31:25 +0000 Subject: [PATCH] =?UTF-8?q?op-cuda:=E9=87=8D=E5=91=BD=E5=90=8D?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .github/workflows/executor-op-cuda-linux.yml | 8 ++++---- executor/{op-mem-cuda => op-cuda}/.gitignore | 0 executor/{op-mem-cuda => op-cuda}/CMakeLists.txt | 0 executor/{op-mem-cuda => op-cuda}/Dockerfile | 0 executor/{op-mem-cuda => op-cuda}/README.md | 0 executor/op-cuda/build.sh | 4 ++++ executor/{op-mem-cuda => op-cuda}/dockerbuild.sh | 0 executor/{op-mem-cuda => op-cuda}/log.md | 0 executor/{op-mem-cuda => op-cuda}/src/client/main.cpp | 0 executor/{op-mem-cuda => op-cuda}/src/client/tfs.cpp | 0 executor/{op-mem-cuda => op-cuda}/src/client/tfs.hpp | 0 .../{op-mem-cuda => op-cuda}/src/deepx/dtype_cuda.hpp | 0 .../{op-mem-cuda => op-cuda}/src/deepx/mem/mem_cuda.hpp | 0 .../src/deepx/tensorfunc/changeshape_miaobyte.cu | 0 .../src/deepx/tensorfunc/changeshape_miaobyte.cuh | 0 .../src/deepx/tensorfunc/changeshape_miaobyte.hpp | 0 .../src/deepx/tensorfunc/cuda.hpp | 0 .../src/deepx/tensorfunc/cuda_atomic.cuh | 0 .../src/deepx/tensorfunc/cuda_math.cuh | 0 .../src/deepx/tensorfunc/elementwise_cublas_basic.hpp | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_basic.cu | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_basic.cuh | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_basic.hpp | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_compare.cu | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_compare.cuh | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_compare.hpp | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_sin.cu | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_sin.cuh | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_sin.hpp | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cu | 0 .../src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cuh | 0 
.../src/deepx/tensorfunc/elementwise_miaobyte_sqrt.hpp | 0 .../src/deepx/tensorfunc/init_miaobyte.cu | 0 .../src/deepx/tensorfunc/init_miaobyte.cuh | 0 .../src/deepx/tensorfunc/init_miaobyte.hpp | 0 .../src/deepx/tensorfunc/io_miaobyte.hpp | 0 .../src/deepx/tensorfunc/matmul_cublas.hpp | 0 .../src/deepx/tensorfunc/new_mempool.hpp | 0 .../src/deepx/tensorfunc/reduce_miaobyte.cu | 0 .../src/deepx/tensorfunc/reduce_miaobyte.cuh | 0 .../src/deepx/tensorfunc/reduce_miaobyte.hpp | 0 .../src/deepx/tensorfunc/tensor_cuda.cuh | 0 .../src/deepx/tensorfunc/tensorlife_miaobyte.hpp | 0 .../src/deepx/tensorfunc/vector_cuda.cuh | 0 executor/{op-mem-cuda => op-cuda}/src/deepx/tf/arg.hpp | 0 .../{op-mem-cuda => op-cuda}/src/deepx/tf/changeshape.hpp | 0 .../src/deepx/tf/elementwise_basic.hpp | 0 .../src/deepx/tf/elementwise_compare.hpp | 0 .../src/deepx/tf/elementwise_sin.hpp | 0 .../src/deepx/tf/elementwise_sqrt.hpp | 0 executor/{op-mem-cuda => op-cuda}/src/deepx/tf/init.hpp | 0 executor/{op-mem-cuda => op-cuda}/src/deepx/tf/io.hpp | 0 executor/{op-mem-cuda => op-cuda}/src/deepx/tf/matmul.hpp | 0 executor/{op-mem-cuda => op-cuda}/src/deepx/tf/reduce.hpp | 0 .../{op-mem-cuda => op-cuda}/src/deepx/tf/tensorlife.hpp | 0 executor/{op-mem-cuda => op-cuda}/test/op/CMakeLists.txt | 0 .../{op-mem-cuda => op-cuda}/test/tensorfunc/0_new.cpp | 0 .../test/tensorfunc/1_cublas_add.cpp | 0 .../test/tensorfunc/1_cublas_matmul.cpp | 0 .../test/tensorfunc/2_changeshape.cpp | 0 .../test/tensorfunc/CMakeLists.txt | 0 executor/op-mem-cuda/build.sh | 4 ---- 62 files changed, 8 insertions(+), 8 deletions(-) rename executor/{op-mem-cuda => op-cuda}/.gitignore (100%) rename executor/{op-mem-cuda => op-cuda}/CMakeLists.txt (100%) rename executor/{op-mem-cuda => op-cuda}/Dockerfile (100%) rename executor/{op-mem-cuda => op-cuda}/README.md (100%) create mode 100644 executor/op-cuda/build.sh rename executor/{op-mem-cuda => op-cuda}/dockerbuild.sh (100%) rename executor/{op-mem-cuda => op-cuda}/log.md (100%) 
rename executor/{op-mem-cuda => op-cuda}/src/client/main.cpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/client/tfs.cpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/client/tfs.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/dtype_cuda.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/mem/mem_cuda.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/changeshape_miaobyte.cu (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/changeshape_miaobyte.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/changeshape_miaobyte.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/cuda.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/cuda_atomic.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/cuda_math.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_cublas_basic.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_basic.cu (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_basic.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_basic.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_compare.cu (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_compare.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_compare.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_sin.cu (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_sin.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_sin.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cu (100%) rename executor/{op-mem-cuda 
=> op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/init_miaobyte.cu (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/init_miaobyte.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/init_miaobyte.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/io_miaobyte.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/matmul_cublas.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/new_mempool.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/reduce_miaobyte.cu (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/reduce_miaobyte.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/reduce_miaobyte.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/tensor_cuda.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/tensorlife_miaobyte.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tensorfunc/vector_cuda.cuh (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tf/arg.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tf/changeshape.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tf/elementwise_basic.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tf/elementwise_compare.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tf/elementwise_sin.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tf/elementwise_sqrt.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tf/init.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tf/io.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tf/matmul.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/src/deepx/tf/reduce.hpp (100%) rename 
executor/{op-mem-cuda => op-cuda}/src/deepx/tf/tensorlife.hpp (100%) rename executor/{op-mem-cuda => op-cuda}/test/op/CMakeLists.txt (100%) rename executor/{op-mem-cuda => op-cuda}/test/tensorfunc/0_new.cpp (100%) rename executor/{op-mem-cuda => op-cuda}/test/tensorfunc/1_cublas_add.cpp (100%) rename executor/{op-mem-cuda => op-cuda}/test/tensorfunc/1_cublas_matmul.cpp (100%) rename executor/{op-mem-cuda => op-cuda}/test/tensorfunc/2_changeshape.cpp (100%) rename executor/{op-mem-cuda => op-cuda}/test/tensorfunc/CMakeLists.txt (100%) delete mode 100644 executor/op-mem-cuda/build.sh diff --git a/.github/workflows/executor-op-cuda-linux.yml b/.github/workflows/executor-op-cuda-linux.yml index e9c94037..6f7b81b8 100644 --- a/.github/workflows/executor-op-cuda-linux.yml +++ b/.github/workflows/executor-op-cuda-linux.yml @@ -2,10 +2,10 @@ name: Excuter/cuda-linux Build on: push: paths: - - 'executor/op-mem-cuda/**' + - 'executor/op-cuda/**' pull_request: paths: - - 'executor/op-mem-cuda/**' + - 'executor/op-cuda/**' env: CUDA_VERSION: "12.6.0" CUDA_MAJOR_VERSION: "12" @@ -34,7 +34,7 @@ jobs: run: | docker run --rm -v ${{ github.workspace }}:/workspace \ -w /workspace \ - nvidia/cuda:12.6.0-devel-ubuntu22.04 \ + nvidia/cuda:${CUDA_VERSION}-devel-ubuntu22.04 \ /bin/bash -c " # 安装系统依赖 apt-get update && \ @@ -68,7 +68,7 @@ jobs: ninja && \ # 构建 CUDA 执行器 - cd ../../op-mem-cuda && \ + cd ../../op-cuda && \ mkdir -p build && cd build && \ cmake -DCMAKE_BUILD_TYPE=Release \ -DCMAKE_CXX_COMPILER_LAUNCHER=ccache \ diff --git a/executor/op-mem-cuda/.gitignore b/executor/op-cuda/.gitignore similarity index 100% rename from executor/op-mem-cuda/.gitignore rename to executor/op-cuda/.gitignore diff --git a/executor/op-mem-cuda/CMakeLists.txt b/executor/op-cuda/CMakeLists.txt similarity index 100% rename from executor/op-mem-cuda/CMakeLists.txt rename to executor/op-cuda/CMakeLists.txt diff --git a/executor/op-mem-cuda/Dockerfile b/executor/op-cuda/Dockerfile similarity index 100% 
rename from executor/op-mem-cuda/Dockerfile rename to executor/op-cuda/Dockerfile diff --git a/executor/op-mem-cuda/README.md b/executor/op-cuda/README.md similarity index 100% rename from executor/op-mem-cuda/README.md rename to executor/op-cuda/README.md diff --git a/executor/op-cuda/build.sh b/executor/op-cuda/build.sh new file mode 100644 index 00000000..6b33ddb8 --- /dev/null +++ b/executor/op-cuda/build.sh @@ -0,0 +1,4 @@ +rm -rf build # drop any stale build tree before configuring +mkdir -p build && cd build || exit 1 +cmake .. +make -j$(nproc) diff --git a/executor/op-mem-cuda/dockerbuild.sh b/executor/op-cuda/dockerbuild.sh similarity index 100% rename from executor/op-mem-cuda/dockerbuild.sh rename to executor/op-cuda/dockerbuild.sh diff --git a/executor/op-mem-cuda/log.md b/executor/op-cuda/log.md similarity index 100% rename from executor/op-mem-cuda/log.md rename to executor/op-cuda/log.md diff --git a/executor/op-mem-cuda/src/client/main.cpp b/executor/op-cuda/src/client/main.cpp similarity index 100% rename from executor/op-mem-cuda/src/client/main.cpp rename to executor/op-cuda/src/client/main.cpp diff --git a/executor/op-mem-cuda/src/client/tfs.cpp b/executor/op-cuda/src/client/tfs.cpp similarity index 100% rename from executor/op-mem-cuda/src/client/tfs.cpp rename to executor/op-cuda/src/client/tfs.cpp diff --git a/executor/op-mem-cuda/src/client/tfs.hpp b/executor/op-cuda/src/client/tfs.hpp similarity index 100% rename from executor/op-mem-cuda/src/client/tfs.hpp rename to executor/op-cuda/src/client/tfs.hpp diff --git a/executor/op-mem-cuda/src/deepx/dtype_cuda.hpp b/executor/op-cuda/src/deepx/dtype_cuda.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/dtype_cuda.hpp rename to executor/op-cuda/src/deepx/dtype_cuda.hpp diff --git a/executor/op-mem-cuda/src/deepx/mem/mem_cuda.hpp b/executor/op-cuda/src/deepx/mem/mem_cuda.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/mem/mem_cuda.hpp rename to executor/op-cuda/src/deepx/mem/mem_cuda.hpp diff --git 
a/executor/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cu b/executor/op-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cu similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cu rename to executor/op-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cu diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cuh b/executor/op-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cuh rename to executor/op-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cuh diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.hpp b/executor/op-cuda/src/deepx/tensorfunc/changeshape_miaobyte.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.hpp rename to executor/op-cuda/src/deepx/tensorfunc/changeshape_miaobyte.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/cuda.hpp b/executor/op-cuda/src/deepx/tensorfunc/cuda.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/cuda.hpp rename to executor/op-cuda/src/deepx/tensorfunc/cuda.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/cuda_atomic.cuh b/executor/op-cuda/src/deepx/tensorfunc/cuda_atomic.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/cuda_atomic.cuh rename to executor/op-cuda/src/deepx/tensorfunc/cuda_atomic.cuh diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/cuda_math.cuh b/executor/op-cuda/src/deepx/tensorfunc/cuda_math.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/cuda_math.cuh rename to executor/op-cuda/src/deepx/tensorfunc/cuda_math.cuh diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_cublas_basic.hpp b/executor/op-cuda/src/deepx/tensorfunc/elementwise_cublas_basic.hpp similarity index 100% rename from 
executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_cublas_basic.hpp rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_cublas_basic.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cu b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cu similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cu rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cu diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cuh b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cuh rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cuh diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.hpp b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.hpp rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.cu b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.cu similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.cu rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.cu diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.cuh b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.cuh rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.cuh diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.hpp 
b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.hpp rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_compare.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.cu b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.cu similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.cu rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.cu diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.cuh b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.cuh rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.cuh diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.hpp b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.hpp rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sin.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cu b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cu similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cu rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cu diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cuh b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cuh rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.cuh diff --git 
a/executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.hpp b/executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.hpp rename to executor/op-cuda/src/deepx/tensorfunc/elementwise_miaobyte_sqrt.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/init_miaobyte.cu b/executor/op-cuda/src/deepx/tensorfunc/init_miaobyte.cu similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/init_miaobyte.cu rename to executor/op-cuda/src/deepx/tensorfunc/init_miaobyte.cu diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/init_miaobyte.cuh b/executor/op-cuda/src/deepx/tensorfunc/init_miaobyte.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/init_miaobyte.cuh rename to executor/op-cuda/src/deepx/tensorfunc/init_miaobyte.cuh diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/init_miaobyte.hpp b/executor/op-cuda/src/deepx/tensorfunc/init_miaobyte.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/init_miaobyte.hpp rename to executor/op-cuda/src/deepx/tensorfunc/init_miaobyte.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/io_miaobyte.hpp b/executor/op-cuda/src/deepx/tensorfunc/io_miaobyte.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/io_miaobyte.hpp rename to executor/op-cuda/src/deepx/tensorfunc/io_miaobyte.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/matmul_cublas.hpp b/executor/op-cuda/src/deepx/tensorfunc/matmul_cublas.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/matmul_cublas.hpp rename to executor/op-cuda/src/deepx/tensorfunc/matmul_cublas.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/new_mempool.hpp b/executor/op-cuda/src/deepx/tensorfunc/new_mempool.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/new_mempool.hpp rename to 
executor/op-cuda/src/deepx/tensorfunc/new_mempool.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/reduce_miaobyte.cu b/executor/op-cuda/src/deepx/tensorfunc/reduce_miaobyte.cu similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/reduce_miaobyte.cu rename to executor/op-cuda/src/deepx/tensorfunc/reduce_miaobyte.cu diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/reduce_miaobyte.cuh b/executor/op-cuda/src/deepx/tensorfunc/reduce_miaobyte.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/reduce_miaobyte.cuh rename to executor/op-cuda/src/deepx/tensorfunc/reduce_miaobyte.cuh diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/reduce_miaobyte.hpp b/executor/op-cuda/src/deepx/tensorfunc/reduce_miaobyte.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/reduce_miaobyte.hpp rename to executor/op-cuda/src/deepx/tensorfunc/reduce_miaobyte.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/tensor_cuda.cuh b/executor/op-cuda/src/deepx/tensorfunc/tensor_cuda.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/tensor_cuda.cuh rename to executor/op-cuda/src/deepx/tensorfunc/tensor_cuda.cuh diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/tensorlife_miaobyte.hpp b/executor/op-cuda/src/deepx/tensorfunc/tensorlife_miaobyte.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/tensorlife_miaobyte.hpp rename to executor/op-cuda/src/deepx/tensorfunc/tensorlife_miaobyte.hpp diff --git a/executor/op-mem-cuda/src/deepx/tensorfunc/vector_cuda.cuh b/executor/op-cuda/src/deepx/tensorfunc/vector_cuda.cuh similarity index 100% rename from executor/op-mem-cuda/src/deepx/tensorfunc/vector_cuda.cuh rename to executor/op-cuda/src/deepx/tensorfunc/vector_cuda.cuh diff --git a/executor/op-mem-cuda/src/deepx/tf/arg.hpp b/executor/op-cuda/src/deepx/tf/arg.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tf/arg.hpp 
rename to executor/op-cuda/src/deepx/tf/arg.hpp diff --git a/executor/op-mem-cuda/src/deepx/tf/changeshape.hpp b/executor/op-cuda/src/deepx/tf/changeshape.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tf/changeshape.hpp rename to executor/op-cuda/src/deepx/tf/changeshape.hpp diff --git a/executor/op-mem-cuda/src/deepx/tf/elementwise_basic.hpp b/executor/op-cuda/src/deepx/tf/elementwise_basic.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tf/elementwise_basic.hpp rename to executor/op-cuda/src/deepx/tf/elementwise_basic.hpp diff --git a/executor/op-mem-cuda/src/deepx/tf/elementwise_compare.hpp b/executor/op-cuda/src/deepx/tf/elementwise_compare.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tf/elementwise_compare.hpp rename to executor/op-cuda/src/deepx/tf/elementwise_compare.hpp diff --git a/executor/op-mem-cuda/src/deepx/tf/elementwise_sin.hpp b/executor/op-cuda/src/deepx/tf/elementwise_sin.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tf/elementwise_sin.hpp rename to executor/op-cuda/src/deepx/tf/elementwise_sin.hpp diff --git a/executor/op-mem-cuda/src/deepx/tf/elementwise_sqrt.hpp b/executor/op-cuda/src/deepx/tf/elementwise_sqrt.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tf/elementwise_sqrt.hpp rename to executor/op-cuda/src/deepx/tf/elementwise_sqrt.hpp diff --git a/executor/op-mem-cuda/src/deepx/tf/init.hpp b/executor/op-cuda/src/deepx/tf/init.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tf/init.hpp rename to executor/op-cuda/src/deepx/tf/init.hpp diff --git a/executor/op-mem-cuda/src/deepx/tf/io.hpp b/executor/op-cuda/src/deepx/tf/io.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tf/io.hpp rename to executor/op-cuda/src/deepx/tf/io.hpp diff --git a/executor/op-mem-cuda/src/deepx/tf/matmul.hpp b/executor/op-cuda/src/deepx/tf/matmul.hpp similarity index 100% rename from 
executor/op-mem-cuda/src/deepx/tf/matmul.hpp rename to executor/op-cuda/src/deepx/tf/matmul.hpp diff --git a/executor/op-mem-cuda/src/deepx/tf/reduce.hpp b/executor/op-cuda/src/deepx/tf/reduce.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tf/reduce.hpp rename to executor/op-cuda/src/deepx/tf/reduce.hpp diff --git a/executor/op-mem-cuda/src/deepx/tf/tensorlife.hpp b/executor/op-cuda/src/deepx/tf/tensorlife.hpp similarity index 100% rename from executor/op-mem-cuda/src/deepx/tf/tensorlife.hpp rename to executor/op-cuda/src/deepx/tf/tensorlife.hpp diff --git a/executor/op-mem-cuda/test/op/CMakeLists.txt b/executor/op-cuda/test/op/CMakeLists.txt similarity index 100% rename from executor/op-mem-cuda/test/op/CMakeLists.txt rename to executor/op-cuda/test/op/CMakeLists.txt diff --git a/executor/op-mem-cuda/test/tensorfunc/0_new.cpp b/executor/op-cuda/test/tensorfunc/0_new.cpp similarity index 100% rename from executor/op-mem-cuda/test/tensorfunc/0_new.cpp rename to executor/op-cuda/test/tensorfunc/0_new.cpp diff --git a/executor/op-mem-cuda/test/tensorfunc/1_cublas_add.cpp b/executor/op-cuda/test/tensorfunc/1_cublas_add.cpp similarity index 100% rename from executor/op-mem-cuda/test/tensorfunc/1_cublas_add.cpp rename to executor/op-cuda/test/tensorfunc/1_cublas_add.cpp diff --git a/executor/op-mem-cuda/test/tensorfunc/1_cublas_matmul.cpp b/executor/op-cuda/test/tensorfunc/1_cublas_matmul.cpp similarity index 100% rename from executor/op-mem-cuda/test/tensorfunc/1_cublas_matmul.cpp rename to executor/op-cuda/test/tensorfunc/1_cublas_matmul.cpp diff --git a/executor/op-mem-cuda/test/tensorfunc/2_changeshape.cpp b/executor/op-cuda/test/tensorfunc/2_changeshape.cpp similarity index 100% rename from executor/op-mem-cuda/test/tensorfunc/2_changeshape.cpp rename to executor/op-cuda/test/tensorfunc/2_changeshape.cpp diff --git a/executor/op-mem-cuda/test/tensorfunc/CMakeLists.txt b/executor/op-cuda/test/tensorfunc/CMakeLists.txt similarity index 100% 
rename from executor/op-mem-cuda/test/tensorfunc/CMakeLists.txt rename to executor/op-cuda/test/tensorfunc/CMakeLists.txt diff --git a/executor/op-mem-cuda/build.sh b/executor/op-mem-cuda/build.sh deleted file mode 100644 index bc8e0b91..00000000 --- a/executor/op-mem-cuda/build.sh +++ /dev/null @@ -1,4 +0,0 @@ -cd build -rm -rf * -cmake .. -make -j$(nproc)