From f71f809bfd2b3ce3280d5ff440c854ad891d23b0 Mon Sep 17 00:00:00 2001
From: miaobyte <734991033@qq.com>
Date: Thu, 20 Mar 2025 16:04:06 +0800
Subject: [PATCH 1/5] excuter(cpu/cuda): subscalar

---
 doc/excuter/op-mem-cuda/list.md               |   2 +
 doc/excuter/op-mem-ompsimd/list.md            |   1 +
 .../src/deepx/tensorfunc/elementwise.hpp      |  12 +-
 excuter/op-mem-cuda/src/client/tfs.cpp        |  13 +-
 .../tensorfunc/elementwise_miaobyte_basic.cu  |  29 ++-
 .../tensorfunc/elementwise_miaobyte_basic.cuh |  33 ++-
 .../tensorfunc/elementwise_miaobyte_basic.hpp |  14 ++
 .../src/deepx/tf/elementwise_basic.hpp        |  82 ++++++-
 excuter/op-mem-ompsimd/src/client/tfs.cpp     |  10 +
 .../src/deepx/tf/elementwise.hpp              | 222 +++++++++++-------
 10 files changed, 320 insertions(+), 98 deletions(-)

diff --git a/doc/excuter/op-mem-cuda/list.md b/doc/excuter/op-mem-cuda/list.md
index 171779a4..9913a248 100644
--- a/doc/excuter/op-mem-cuda/list.md
+++ b/doc/excuter/op-mem-cuda/list.md
@@ -5,8 +5,10 @@
 | Operation | Author | Func Def | Math Formula | IR Instruction |
 |-----------|--------|------------|--------------|----------------|
 | addscalar | miaobyte | addscalar(tensor A, var b)->(tensor C) | T3=T1+scalar | addscalar(tensor A, var b)->(tensor C) |
+| add | cublas | add(tensor a, tensor b)->(tensor c) | T3=T1+T2 | add(tensor a, tensor b)->(tensor c) |
 | add | miaobyte | add(tensor a, tensor b)->(tensor c) | T3=T1+T2 | add(tensor a, tensor b)->(tensor c) |
 | uniform | miaobyte | uniform(tensor t, var low, var high, var seed)->() | uniform(T1,low,high,seed) | uniform(tensor t, var low, var high, var seed)->() |
+| subscalar | miaobyte | subscalar(tensor A, var b)->(tensor C) | T3=T1-scalar | subscalar(tensor A, var b)->(tensor C) |
 | arange | miaobyte | arange(tensor t, var start, var step)->() | arange(T1,start,step) | arange(tensor t, var start, var step)->() |
 | constant | miaobyte | constant(tensor t, var value)->() | constant(T1) | constant(tensor t, var value)->() |
 | print | miaobyte | print(tensor )->() | print(T1) | print(tensor )->() |

diff --git a/doc/excuter/op-mem-ompsimd/list.md b/doc/excuter/op-mem-ompsimd/list.md
index 581ab8f9..f10183f4 100644
--- a/doc/excuter/op-mem-ompsimd/list.md
+++ b/doc/excuter/op-mem-ompsimd/list.md
@@ -9,6 +9,7 @@
 | add | cblas | add(tensor a, tensor b)->(tensor c) | T3=T1+T2 | add(tensor a, tensor b)->(tensor c) |
 | add | miaobyte | add(tensor a, tensor b)->(tensor c) | T3=T1+T2 | add(tensor a, tensor b)->(tensor c) |
 | uniform | miaobyte | uniform(tensor t, var low, var high, var seed)->() | uniform(T1,low,high,seed) | uniform(tensor t, var low, var high, var seed)->() |
+| subscalar | miaobyte | subscalar(tensor a, var scalar)->(tensor c) | T3=T1-scalar | subscalar(tensor a, var scalar)->(tensor c) |
 | arange | miaobyte | arange(tensor t, var start, var step)->() | arange(T1,start,step) | arange(tensor t, var start, var step)->() |
 | constant | miaobyte | constant(tensor t, var value)->() | constant(T1,value) | constant(tensor t, var value)->() |
 | print | miaobyte | print(tensor )->() | print(T1) | print(tensor )->() |

diff --git a/excuter/cpp-common/src/deepx/tensorfunc/elementwise.hpp b/excuter/cpp-common/src/deepx/tensorfunc/elementwise.hpp
index bf6fd053..e05506f7 100644
--- a/excuter/cpp-common/src/deepx/tensorfunc/elementwise.hpp
+++ b/excuter/cpp-common/src/deepx/tensorfunc/elementwise.hpp
@@ -24,7 +24,9 @@ namespace deepx::tensorfunc
     template <typename Author, typename T>
     struct addscalarDispatcher
     {
-        static void addscalar(const Tensor<T> &input, const T value, Tensor<T> &output) = delete;
+        static void addscalar(const Tensor<T> &input, const T value, Tensor<T> &output){
+            throw NotImplementError("addscalar");
+        }
     };
 
     template <typename Author, typename T>
@@ -36,7 +38,9 @@ namespace deepx::tensorfunc
     template <typename Author, typename T>
     struct subDispatcher
     {
-        static void sub(const Tensor<T> &A, const Tensor<T> &B, Tensor<T> &C) = delete;
+        static void sub(const Tensor<T> &A, const Tensor<T> &B, Tensor<T> &C){
+            throw NotImplementError("sub");
+        }
     };
 
     template <typename Author, typename T>
@@ -48,7 +52,9 @@ namespace deepx::tensorfunc
     template <typename Author, typename T>
     struct subscalarDispatcher
     {
-        static void subscalar(const Tensor<T> &input, const T value, Tensor<T> &output) = delete;
+        static void subscalar(const Tensor<T> &input, const T value, Tensor<T> &output){
+            throw NotImplementError("subscalar");
+        }
     };
 
     template <typename Author, typename T>

diff --git a/excuter/op-mem-cuda/src/client/tfs.cpp b/excuter/op-mem-cuda/src/client/tfs.cpp
index 41108a7f..cfcbec3b 100644
--- a/excuter/op-mem-cuda/src/client/tfs.cpp
+++ b/excuter/op-mem-cuda/src/client/tfs.cpp
@@ -114,7 +114,7 @@ namespace deepx::tf
                                                        {
                                                            Param("c", DataCategory::Tensor, Precision::Any),
                                                        })));
-        tffactory.add_tf(std::make_shared<Addscalar<miaobyte>>(vector<Param>(
+        tffactory.add_tf(std::make_shared<AddScalar<miaobyte>>(vector<Param>(
                                                            {
                                                                Param("A", DataCategory::Tensor, Precision::Any),
                                                                Param("b", DataCategory::Var, Precision::Any),
@@ -133,7 +133,16 @@ namespace deepx::tf
                                                        {
                                                            Param("C", DataCategory::Tensor, Precision::Any),
                                                        })));
-
+        tffactory.add_tf(std::make_shared<SubScalar<miaobyte>>(vector<Param>(
+                                                           {
+                                                               Param("A", DataCategory::Tensor, Precision::Any),
+                                                               Param("b", DataCategory::Var, Precision::Any),
+                                                           }),
+                                                           vector<Param>(
+                                                           {
+                                                               Param("C", DataCategory::Tensor, Precision::Any),
+                                                           })));
+
         // opfactory.add_op(Sub_cblas<float>());
         // opfactory.add_op(Sub_cblas<double>());

diff --git a/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cu b/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cu
index f66950ac..f4836cd6 100644
--- a/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cu
+++ b/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cu
@@ -105,7 +105,34 @@ namespace deepx::tensorfunc
     template void launch_sub<int16_t>(const int numBlocks, const int blockSize, const int16_t* a, const int16_t* b, int16_t* c, const int size);
     template void launch_sub<int8_t>(const int numBlocks, const int blockSize, const int8_t* a, const int8_t* b, int8_t* c, const int size);
-
+
+    template <typename T>
+    __global__ void subscalar_kernel(const T* A, const T scalar, T* C, const int size){
+        int idx = blockIdx.x * blockDim.x + threadIdx.x;
+        if (idx < size) {
+            C[idx] = A[idx] - scalar;
+        }
+    }
+    template __global__ void subscalar_kernel<double>(const double* A, const double scalar, double* C, const int size);
+    template __global__ void subscalar_kernel<float>(const float* A, const float scalar, float* C, const int size);
+    template __global__ void subscalar_kernel<half>(const half* A, const half scalar, half* C, const int size);
+    template __global__ void subscalar_kernel<nv_bfloat16>(const nv_bfloat16* A, const nv_bfloat16 scalar, nv_bfloat16* C, const int size);
+    template __global__ void subscalar_kernel<int64_t>(const int64_t* A, const int64_t scalar, int64_t* C, const int size);
+    template __global__ void subscalar_kernel<int32_t>(const int32_t* A, const int32_t scalar, int32_t* C, const int size);
+    template __global__ void subscalar_kernel<int16_t>(const int16_t* A, const int16_t scalar, int16_t* C, const int size);
+    template __global__ void subscalar_kernel<int8_t>(const int8_t* A, const int8_t scalar, int8_t* C, const int size);
+
+    template <typename T>
+    void launch_subscalar(const int numBlocks, const int blockSize, const T* a, const T scalar, T* c, const int size) {
+        subscalar_kernel<<<numBlocks, blockSize>>>(a, scalar, c, size);
+    }
+    template void launch_subscalar<double>(const int numBlocks, const int blockSize, const double* a, const double scalar, double* c, const int size);
+    template void launch_subscalar<float>(const int numBlocks, const int blockSize, const float* a, const float scalar, float* c, const int size);
+    template void launch_subscalar<half>(const int numBlocks, const int blockSize, const half* a, const half scalar, half* c, const int size);
+    template void launch_subscalar<nv_bfloat16>(const int numBlocks, const int blockSize, const nv_bfloat16* a, const nv_bfloat16 scalar, nv_bfloat16* c, const int size);
+    template void launch_subscalar<int64_t>(const int numBlocks, const int blockSize, const int64_t* a, const int64_t scalar, int64_t* c, const int size);
+    template void launch_subscalar<int32_t>(const int numBlocks, const int blockSize, const int32_t* a, const int32_t scalar, int32_t* c, const int size);
+    template void launch_subscalar<int16_t>(const int numBlocks, const int blockSize, const int16_t* a, const int16_t scalar, int16_t* c, const int size);
+    template void launch_subscalar<int8_t>(const int numBlocks, const int blockSize, const int8_t* a, const int8_t scalar, int8_t* c, const int size);
 }
 
 #endif // DEEPX_TENSORFUNC_ELEMENTWISE_MIAO_BYTE_BASIC_CUH

diff --git a/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cuh b/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cuh
index 77102fc9..966cfa1c 100644
--- a/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cuh
+++ b/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.cuh
@@ -103,7 +103,38 @@ namespace deepx::tensorfunc
     template <>
     void launch_sub<int8_t>(int numBlocks, int blockSize, const int8_t* a, const int8_t* b, int8_t* c, const int size);
-
+
+    // subscalar
+    template <typename T>
+    __global__ void subscalar_kernel(const T* A, const T scalar, T* C, const int size);
+
+    template <typename T>
+    void launch_subscalar(const int numBlocks, const int blockSize, const T* a, const T scalar, T* c, const int size);
+
+    template <>
+    void launch_subscalar<double>(const int numBlocks, const int blockSize, const double* a, const double scalar, double* c, const int size);
+
+    template <>
+    void launch_subscalar<float>(const int numBlocks, const int blockSize, const float* a, const float scalar, float* c, const int size);
+
+    template <>
+    void launch_subscalar<nv_bfloat16>(const int numBlocks, const int blockSize, const nv_bfloat16* a, const nv_bfloat16 scalar, nv_bfloat16* c, const int size);
+
+    template <>
+    void launch_subscalar<__half>(const int numBlocks, const int blockSize, const __half* a, const __half scalar, __half* c, const int size);
+
+    template <>
+    void launch_subscalar<int64_t>(const int numBlocks, const int blockSize, const int64_t* a, const int64_t scalar, int64_t* c, const int size);
+
+    template <>
+    void launch_subscalar<int32_t>(const int numBlocks, const int blockSize, const int32_t* a, const int32_t scalar, int32_t* c, const int size);
+
+    template <>
+    void launch_subscalar<int16_t>(const int numBlocks, const int blockSize, const int16_t* a, const int16_t scalar, int16_t* c, const int size);
+
+    template <>
+    void launch_subscalar<int8_t>(const int numBlocks, const int blockSize, const int8_t* a, const int8_t scalar, int8_t* c, const int size);
+
 }
 #endif // DEEPX_TENSORFUNC_ELEMENTWISE_MIAO_BYTE_BASIC_CUH

diff --git a/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.hpp b/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.hpp
index 2da8ec9c..0500dd60 100644
--- a/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.hpp
+++ b/excuter/op-mem-cuda/src/deepx/tensorfunc/elementwise_miaobyte_basic.hpp
@@ -55,6 +55,20 @@ namespace deepx::tensorfunc
             launch_sub(numBlocks, blockSize, A.data, B.data, C.data, A.shape.size);
         }
     };
+
+    template <typename T>
+    struct subscalarDispatcher<miaobyte, T>
+    {
+        static void subscalar(const Tensor<T> &A, const T scalar, Tensor<T> &C)
+        {
+            if (A.shape.size != C.shape.size) {
+                throw TensorShapeError("subscalar");
+            }
+            const int blockSize = A.shape.size > 256 ? 256 : A.shape.size;
+            int numBlocks = (A.shape.size + blockSize - 1) / blockSize;
+            launch_subscalar(numBlocks, blockSize, A.data, scalar, C.data, A.shape.size);
+        }
+    };
 }
 
 #endif // DEEPX_TENSORFUNC_ELEMENTWISE_MIAO_BYTE_BASIC_HPP

diff --git a/excuter/op-mem-cuda/src/deepx/tf/elementwise_basic.hpp b/excuter/op-mem-cuda/src/deepx/tf/elementwise_basic.hpp
index 218432a8..c0910a99 100644
--- a/excuter/op-mem-cuda/src/deepx/tf/elementwise_basic.hpp
+++ b/excuter/op-mem-cuda/src/deepx/tf/elementwise_basic.hpp
@@ -83,10 +83,10 @@ namespace deepx::tf
     };
 
     template <typename Author>
-    class Addscalar : public TF
+    class AddScalar : public TF
     {
     public:
-        Addscalar(const vector<Param> &args, const vector<Param> &returns)
+        AddScalar(const vector<Param> &args, const vector<Param> &returns)
         {
             this->name = "addscalar";
             this->author = Author::name();
@@ -94,7 +94,7 @@ namespace deepx::tf
             this->returns = returns;
         }
 
-        Addscalar(string text)
+        AddScalar(string text)
         {
             this->parse(text);
             this->author = Author::name();
@@ -109,7 +109,7 @@ namespace deepx::tf
         }
         shared_ptr<TF> clone() const override
         {
-            return make_shared<Addscalar<Author>>(*this);
+            return make_shared<AddScalar<Author>>(*this);
         }
         int run(shared_ptr<MemBase> mem, string &error) override
         {
@@ -226,6 +226,80 @@ namespace deepx::tf
             return 0;
         }
     };
+
+    template <typename Author>
+    class SubScalar : public TF
+    {
+    public:
+        SubScalar(const vector<Param> &args, const vector<Param> &returns)
+        {
+            this->name = "subscalar";
+            this->author = Author::name();
+            this->args = args;
+            this->returns = returns;
+        }
+
+        SubScalar(string text)
+        {
+            this->parse(text);
+            this->author = Author::name();
+            if (this->name != "subscalar")
+            {
+                throw std::runtime_error("Invalid name: " + this->name);
+            }
+        }
+        string math_formula() const override
+        {
+            return "T3=T1-scalar";
+        }
+        shared_ptr<TF> clone() const override
+        {
+            return make_shared<SubScalar<Author>>(*this);
+        }
+        int run(shared_ptr<MemBase> mem, string &error) override
+        {
+            Precision a_type = mem->gettensor(this->args[0].textvalue).get()->shape.dtype;
+            Precision c_type = mem->gettensor(this->returns[0].textvalue).get()->shape.dtype;
+            if (a_type != c_type)
+            {
+                error = "Type mismatch: " + precision_str(a_type) + " != " + precision_str(c_type);
+                return 1;
+            }
+            switch (a_type)
+            {
+            case Precision::Float64:
+                tensorfunc::subscalar<Author, double>(*mem->gettensor<double>(this->args[0].textvalue), this->getvar<double>(1, mem), *mem->gettensor<double>(this->returns[0].textvalue));
+                break;
+            case Precision::Float32:
+                tensorfunc::subscalar<Author, float>(*mem->gettensor<float>(this->args[0].textvalue), this->getvar<float>(1, mem), *mem->gettensor<float>(this->returns[0].textvalue));
+                break;
+            case Precision::Float16:
+                tensorfunc::subscalar<Author, half>(*mem->gettensor<half>(this->args[0].textvalue), this->getvar<half>(1, mem), *mem->gettensor<half>(this->returns[0].textvalue));
+                break;
+            case Precision::BFloat16:
+                tensorfunc::subscalar<Author, nv_bfloat16>(*mem->gettensor<nv_bfloat16>(this->args[0].textvalue), this->getvar<nv_bfloat16>(1, mem), *mem->gettensor<nv_bfloat16>(this->returns[0].textvalue));
+                break;
+            case Precision::Int64:
+                tensorfunc::subscalar<Author, int64_t>(*mem->gettensor<int64_t>(this->args[0].textvalue), this->getvar<int64_t>(1, mem), *mem->gettensor<int64_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int32:
+                tensorfunc::subscalar<Author, int32_t>(*mem->gettensor<int32_t>(this->args[0].textvalue), this->getvar<int32_t>(1, mem), *mem->gettensor<int32_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int16:
+                tensorfunc::subscalar<Author, int16_t>(*mem->gettensor<int16_t>(this->args[0].textvalue), this->getvar<int16_t>(1, mem), *mem->gettensor<int16_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int8:
+                tensorfunc::subscalar<Author, int8_t>(*mem->gettensor<int8_t>(this->args[0].textvalue), this->getvar<int8_t>(1, mem), *mem->gettensor<int8_t>(this->returns[0].textvalue));
+                break;
+            default:
+                error = "Unsupported dtype: " + precision_str(a_type);
+                return 1;
+            }
+            return 0;
+        }
+    };
+
 };
 
 #endif // DEEPX_TF_ELEMENTWISE_BASIC_HPP
diff --git a/excuter/op-mem-ompsimd/src/client/tfs.cpp b/excuter/op-mem-ompsimd/src/client/tfs.cpp
index 6bae8e79..b2de5145 100644
--- a/excuter/op-mem-ompsimd/src/client/tfs.cpp
+++ b/excuter/op-mem-ompsimd/src/client/tfs.cpp
@@ -140,6 +140,16 @@ namespace deepx::tf
                                                        {
                                                            Param("c", DataCategory::Tensor, Precision::Any),
                                                        })));
+
+        tffactory.add_tf(std::make_shared<SubScalar<miaobyte>>(vector<Param>(
+                                                           {
+                                                               Param("a", DataCategory::Tensor, Precision::Any),
+                                                               Param("scalar", DataCategory::Var, Precision::Any),
+                                                           }),
+                                                           vector<Param>(
+                                                           {
+                                                               Param("c", DataCategory::Tensor, Precision::Any),
+                                                           })));
 
         // opfactory.add_op(Addscalar_miaobyte<float>());
         // opfactory.add_op(Addscalar_miaobyte<double>());

diff --git a/excuter/op-mem-ompsimd/src/deepx/tf/elementwise.hpp b/excuter/op-mem-ompsimd/src/deepx/tf/elementwise.hpp
index 1702c644..5487a2a7 100644
--- a/excuter/op-mem-ompsimd/src/deepx/tf/elementwise.hpp
+++ b/excuter/op-mem-ompsimd/src/deepx/tf/elementwise.hpp
@@ -8,11 +8,13 @@
 #include "deepx/tensorfunc/authors.hpp"
 #include "deepx/tensorfunc/elementwise_miaobyte.hpp"
 #include "deepx/tensorfunc/elementwise_cblas.hpp"
-namespace deepx::tf {
+namespace deepx::tf
+{
 
     template <typename Author>
-    class Add : public TF {
-    public:
+    class Add : public TF
+    {
+    public:
         Add(vector<Param> args, vector<Param> returns)
         {
             this->name = "add";
@@ -23,7 +25,7 @@ namespace deepx::tf
         string math_formula() const override
         {
             return "T3=T1+T2";
-        }
+        }
         shared_ptr<TF> clone() const override
         {
             return make_shared<Add<Author>>(*this);
@@ -38,38 +40,38 @@ namespace deepx::tf
                 error = "Type mismatch: " + precision_str(a_type) + " != " + precision_str(b_type) + " != " + precision_str(c_type);
                 return 1;
             }
-            switch (a_type)
-            {
-                case Precision::Float64:
-                    tensorfunc::add<Author, double>(*mem->gettensor<double>(this->args[0].textvalue), *mem->gettensor<double>(this->args[1].textvalue), *mem->gettensor<double>(this->returns[0].textvalue));
-                    break;
-                case Precision::Float32:
-                    tensorfunc::add<Author, float>(*mem->gettensor<float>(this->args[0].textvalue), *mem->gettensor<float>(this->args[1].textvalue), *mem->gettensor<float>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int64:
-                    tensorfunc::add<Author, int64_t>(*mem->gettensor<int64_t>(this->args[0].textvalue), *mem->gettensor<int64_t>(this->args[1].textvalue), *mem->gettensor<int64_t>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int32:
-                    tensorfunc::add<Author, int32_t>(*mem->gettensor<int32_t>(this->args[0].textvalue), *mem->gettensor<int32_t>(this->args[1].textvalue), *mem->gettensor<int32_t>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int16:
-                    tensorfunc::add<Author, int16_t>(*mem->gettensor<int16_t>(this->args[0].textvalue), *mem->gettensor<int16_t>(this->args[1].textvalue), *mem->gettensor<int16_t>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int8:
-                    tensorfunc::add<Author, int8_t>(*mem->gettensor<int8_t>(this->args[0].textvalue), *mem->gettensor<int8_t>(this->args[1].textvalue), *mem->gettensor<int8_t>(this->returns[0].textvalue));
-                    break;
-                default:
-                    error = "Unsupported dtype: " + precision_str(a_type);
-                    return 1;
+            switch (a_type)
+            {
+            case Precision::Float64:
+                tensorfunc::add<Author, double>(*mem->gettensor<double>(this->args[0].textvalue), *mem->gettensor<double>(this->args[1].textvalue), *mem->gettensor<double>(this->returns[0].textvalue));
+                break;
+            case Precision::Float32:
+                tensorfunc::add<Author, float>(*mem->gettensor<float>(this->args[0].textvalue), *mem->gettensor<float>(this->args[1].textvalue), *mem->gettensor<float>(this->returns[0].textvalue));
+                break;
+            case Precision::Int64:
+                tensorfunc::add<Author, int64_t>(*mem->gettensor<int64_t>(this->args[0].textvalue), *mem->gettensor<int64_t>(this->args[1].textvalue), *mem->gettensor<int64_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int32:
+                tensorfunc::add<Author, int32_t>(*mem->gettensor<int32_t>(this->args[0].textvalue), *mem->gettensor<int32_t>(this->args[1].textvalue), *mem->gettensor<int32_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int16:
+                tensorfunc::add<Author, int16_t>(*mem->gettensor<int16_t>(this->args[0].textvalue), *mem->gettensor<int16_t>(this->args[1].textvalue), *mem->gettensor<int16_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int8:
+                tensorfunc::add<Author, int8_t>(*mem->gettensor<int8_t>(this->args[0].textvalue), *mem->gettensor<int8_t>(this->args[1].textvalue), *mem->gettensor<int8_t>(this->returns[0].textvalue));
+                break;
+            default:
+                error = "Unsupported dtype: " + precision_str(a_type);
+                return 1;
             }
             return 0;
         }
-
     };
 
     template <typename Author>
-    class AddScalar : public TF {
-    public:
+    class AddScalar : public TF
+    {
+    public:
         AddScalar(vector<Param> args, vector<Param> returns)
         {
             this->name = "addscalar";
@@ -80,7 +82,7 @@ namespace deepx::tf
         string math_formula() const override
         {
             return "T3=T1+scalar";
-        }
+        }
         shared_ptr<TF> clone() const override
         {
             return make_shared<AddScalar<Author>>(*this);
@@ -94,37 +96,37 @@ namespace deepx::tf
                 error = "Type mismatch: " + precision_str(a_type) + " != " + precision_str(c_type);
                 return 1;
             }
-            switch (a_type)
-            {
-                case Precision::Float64:
-                    tensorfunc::addscalar<Author, double>(*mem->gettensor<double>(this->args[0].textvalue), this->getvar<double>(1, mem), *mem->gettensor<double>(this->returns[0].textvalue));
-                    break;
-                case Precision::Float32:
-                    tensorfunc::addscalar<Author, float>(*mem->gettensor<float>(this->args[0].textvalue), this->getvar<float>(1, mem), *mem->gettensor<float>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int64:
-                    tensorfunc::addscalar<Author, int64_t>(*mem->gettensor<int64_t>(this->args[0].textvalue), this->getvar<int64_t>(1, mem), *mem->gettensor<int64_t>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int32:
-                    tensorfunc::addscalar<Author, int32_t>(*mem->gettensor<int32_t>(this->args[0].textvalue), this->getvar<int32_t>(1, mem), *mem->gettensor<int32_t>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int16:
-                    tensorfunc::addscalar<Author, int16_t>(*mem->gettensor<int16_t>(this->args[0].textvalue), this->getvar<int16_t>(1, mem), *mem->gettensor<int16_t>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int8:
-                    tensorfunc::addscalar<Author, int8_t>(*mem->gettensor<int8_t>(this->args[0].textvalue), this->getvar<int8_t>(1, mem), *mem->gettensor<int8_t>(this->returns[0].textvalue));
-                    break;
-                default:
-                    error = "Unsupported dtype: " + precision_str(a_type);
-                    return 1;
+            switch (a_type)
+            {
+            case Precision::Float64:
+                tensorfunc::addscalar<Author, double>(*mem->gettensor<double>(this->args[0].textvalue), this->getvar<double>(1, mem), *mem->gettensor<double>(this->returns[0].textvalue));
+                break;
+            case Precision::Float32:
+                tensorfunc::addscalar<Author, float>(*mem->gettensor<float>(this->args[0].textvalue), this->getvar<float>(1, mem), *mem->gettensor<float>(this->returns[0].textvalue));
+                break;
+            case Precision::Int64:
+                tensorfunc::addscalar<Author, int64_t>(*mem->gettensor<int64_t>(this->args[0].textvalue), this->getvar<int64_t>(1, mem), *mem->gettensor<int64_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int32:
+                tensorfunc::addscalar<Author, int32_t>(*mem->gettensor<int32_t>(this->args[0].textvalue), this->getvar<int32_t>(1, mem), *mem->gettensor<int32_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int16:
+                tensorfunc::addscalar<Author, int16_t>(*mem->gettensor<int16_t>(this->args[0].textvalue), this->getvar<int16_t>(1, mem), *mem->gettensor<int16_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int8:
+                tensorfunc::addscalar<Author, int8_t>(*mem->gettensor<int8_t>(this->args[0].textvalue), this->getvar<int8_t>(1, mem), *mem->gettensor<int8_t>(this->returns[0].textvalue));
+                break;
+            default:
+                error = "Unsupported dtype: " + precision_str(a_type);
+                return 1;
             }
             return 0;
         }
-
     };
 
     template <typename Author>
-    class Sub : public TF {
-    public:
+    class Sub : public TF
+    {
+    public:
         Sub(vector<Param> args, vector<Param> returns)
         {
             this->name = "sub";
@@ -135,7 +137,7 @@ namespace deepx::tf
         string math_formula() const override
         {
             return "T3=T1-T2";
-        }
+        }
         shared_ptr<TF> clone() const override
         {
             return make_shared<Sub<Author>>(*this);
@@ -150,43 +152,89 @@ namespace deepx::tf
                 error = "Type mismatch: " + precision_str(a_type) + " != " + precision_str(b_type) + " != " + precision_str(c_type);
                 return 1;
             }
-            switch (a_type)
-            {
-                case Precision::Float64:
-                    tensorfunc::sub<Author, double>(*mem->gettensor<double>(this->args[0].textvalue), *mem->gettensor<double>(this->args[1].textvalue), *mem->gettensor<double>(this->returns[0].textvalue));
-                    break;
-                case Precision::Float32:
-                    tensorfunc::sub<Author, float>(*mem->gettensor<float>(this->args[0].textvalue), *mem->gettensor<float>(this->args[1].textvalue), *mem->gettensor<float>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int64:
-                    tensorfunc::sub<Author, int64_t>(*mem->gettensor<int64_t>(this->args[0].textvalue), *mem->gettensor<int64_t>(this->args[1].textvalue), *mem->gettensor<int64_t>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int32:
-                    tensorfunc::sub<Author, int32_t>(*mem->gettensor<int32_t>(this->args[0].textvalue), *mem->gettensor<int32_t>(this->args[1].textvalue), *mem->gettensor<int32_t>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int16:
-                    tensorfunc::sub<Author, int16_t>(*mem->gettensor<int16_t>(this->args[0].textvalue), *mem->gettensor<int16_t>(this->args[1].textvalue), *mem->gettensor<int16_t>(this->returns[0].textvalue));
-                    break;
-                case Precision::Int8:
-                    tensorfunc::sub<Author, int8_t>(*mem->gettensor<int8_t>(this->args[0].textvalue), *mem->gettensor<int8_t>(this->args[1].textvalue), *mem->gettensor<int8_t>(this->returns[0].textvalue));
-                    break;
-                default:
-                    error = "Unsupported dtype: " + precision_str(a_type);
-                    return 1;
+            switch (a_type)
+            {
+            case Precision::Float64:
+                tensorfunc::sub<Author, double>(*mem->gettensor<double>(this->args[0].textvalue), *mem->gettensor<double>(this->args[1].textvalue), *mem->gettensor<double>(this->returns[0].textvalue));
+                break;
+            case Precision::Float32:
+                tensorfunc::sub<Author, float>(*mem->gettensor<float>(this->args[0].textvalue), *mem->gettensor<float>(this->args[1].textvalue), *mem->gettensor<float>(this->returns[0].textvalue));
+                break;
+            case Precision::Int64:
+                tensorfunc::sub<Author, int64_t>(*mem->gettensor<int64_t>(this->args[0].textvalue), *mem->gettensor<int64_t>(this->args[1].textvalue), *mem->gettensor<int64_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int32:
+                tensorfunc::sub<Author, int32_t>(*mem->gettensor<int32_t>(this->args[0].textvalue), *mem->gettensor<int32_t>(this->args[1].textvalue), *mem->gettensor<int32_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int16:
+                tensorfunc::sub<Author, int16_t>(*mem->gettensor<int16_t>(this->args[0].textvalue), *mem->gettensor<int16_t>(this->args[1].textvalue), *mem->gettensor<int16_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int8:
+                tensorfunc::sub<Author, int8_t>(*mem->gettensor<int8_t>(this->args[0].textvalue), *mem->gettensor<int8_t>(this->args[1].textvalue), *mem->gettensor<int8_t>(this->returns[0].textvalue));
+                break;
+            default:
+                error = "Unsupported dtype: " + precision_str(a_type);
+                return 1;
             }
             return 0;
         }
-
     };
+
+    template <typename Author>
+    class SubScalar : public TF
+    {
+    public:
+        SubScalar(vector<Param> args, vector<Param> returns)
+        {
+            this->name = "subscalar";
+            this->author = Author::name();
+            this->args = args;
+            this->returns = returns;
+        }
+        string math_formula() const override
+        {
+            return "T3=T1-scalar";
+        }
+        shared_ptr<TF> clone() const override
+        {
+            return make_shared<SubScalar<Author>>(*this);
+        }
+        int run(shared_ptr<MemBase> mem, string &error) override
+        {
+            Precision a_type = mem->gettensor(this->args[0].textvalue).get()->shape.dtype;
+            Precision c_type = mem->gettensor(this->returns[0].textvalue).get()->shape.dtype;
+            if (a_type != c_type)
+            {
+                error = "Type mismatch: " + precision_str(a_type) + " != " + precision_str(c_type);
+                return 1;
+            }
+            switch (a_type)
+            {
+            case Precision::Float64:
+                tensorfunc::subscalar<Author, double>(*mem->gettensor<double>(this->args[0].textvalue), this->getvar<double>(1, mem), *mem->gettensor<double>(this->returns[0].textvalue));
+                break;
+            case Precision::Float32:
+                tensorfunc::subscalar<Author, float>(*mem->gettensor<float>(this->args[0].textvalue), this->getvar<float>(1, mem), *mem->gettensor<float>(this->returns[0].textvalue));
+                break;
+            case Precision::Int64:
+                tensorfunc::subscalar<Author, int64_t>(*mem->gettensor<int64_t>(this->args[0].textvalue), this->getvar<int64_t>(1, mem), *mem->gettensor<int64_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int32:
+                tensorfunc::subscalar<Author, int32_t>(*mem->gettensor<int32_t>(this->args[0].textvalue), this->getvar<int32_t>(1, mem), *mem->gettensor<int32_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int16:
+                tensorfunc::subscalar<Author, int16_t>(*mem->gettensor<int16_t>(this->args[0].textvalue), this->getvar<int16_t>(1, mem), *mem->gettensor<int16_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int8:
+                tensorfunc::subscalar<Author, int8_t>(*mem->gettensor<int8_t>(this->args[0].textvalue), this->getvar<int8_t>(1, mem), *mem->gettensor<int8_t>(this->returns[0].textvalue));
+                break;
+            default:
+                error = "Unsupported dtype: " + precision_str(a_type);
+                return 1;
+            }
+            return 0;
+        }
+    };
 }
-
-
-
-
-
-
-
 #endif
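[Reviewer note on patch 1] The whole patch hinges on the author-tag dispatch pattern from cpp-common: a primary `subscalarDispatcher` template that throws, plus per-author partial specializations (CUDA and OMP-SIMD above). The sketch below is a minimal, self-contained illustration of that pattern, not the project's real headers; `Tensor`, `miaobyte`, and the loop body are simplified stand-ins for the actual deepx types and kernels.

```cpp
#include <cstdio>
#include <stdexcept>

struct miaobyte {}; // author tag type; deepx selects implementations by tag

template <typename T>
struct Tensor
{
    T *data;
    int size;
};

// Primary template: the patch replaces `= delete` with a throwing body, so an
// unimplemented (Author, T) pair now fails at run time with a clear message
// instead of breaking compilation of generic registration code.
template <typename Author, typename T>
struct subscalarDispatcher
{
    static void subscalar(const Tensor<T> &, const T, Tensor<T> &)
    {
        throw std::runtime_error("NotImplementError: subscalar");
    }
};

// Author-specific partial specialization, standing in for the CUDA launch or
// the OMP-SIMD loop in the real executors.
template <typename T>
struct subscalarDispatcher<miaobyte, T>
{
    static void subscalar(const Tensor<T> &a, const T scalar, Tensor<T> &c)
    {
        for (int i = 0; i < a.size; ++i)
            c.data[i] = a.data[i] - scalar; // C = A - scalar, elementwise
    }
};

// Thin wrapper, mirroring cpp-common's elementwise.hpp free functions.
template <typename Author, typename T>
void subscalar(const Tensor<T> &a, const T scalar, Tensor<T> &c)
{
    subscalarDispatcher<Author, T>::subscalar(a, scalar, c);
}

int main()
{
    float in[3] = {1.0f, 2.0f, 3.0f};
    float out[3] = {0};
    Tensor<float> a{in, 3}, c{out, 3};
    subscalar<miaobyte, float>(a, 0.5f, c); // resolved to the miaobyte specialization
    std::printf("%.1f %.1f %.1f\n", out[0], out[1], out[2]); // prints: 0.5 1.5 2.5
    return 0;
}
```

The practical effect of the throwing primary template is visible in the tfs.cpp files: the factories can register every (author, dtype) combination uniformly, and a pair nobody has implemented only fails if an IR instruction actually reaches it.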
From 1a92984eae9942d88c45247b68fe797925252507 Mon Sep 17 00:00:00 2001
From: miaobyte <734991033@qq.com>
Date: Wed, 26 Mar 2025 18:19:30 +0800
Subject: [PATCH 2/5] front: newtensor/print joint debugging
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 .../src/deepx/tf/elementwise.hpp              | 113 ++++++++++++++++++
 1 file changed, 113 insertions(+)

diff --git a/excuter/op-mem-ompsimd/src/deepx/tf/elementwise.hpp b/excuter/op-mem-ompsimd/src/deepx/tf/elementwise.hpp
index 5487a2a7..d3342110 100644
--- a/excuter/op-mem-ompsimd/src/deepx/tf/elementwise.hpp
+++ b/excuter/op-mem-ompsimd/src/deepx/tf/elementwise.hpp
@@ -235,6 +235,119 @@ namespace deepx::tf
             return 0;
         }
     };
+
+    template <typename Author>
+    class Mul : public TF
+    {
+    public:
+        Mul(vector<Param> args, vector<Param> returns)
+        {
+            this->name = "mul";
+            this->author = Author::name();
+            this->args = args;
+            this->returns = returns;
+        }
+        string math_formula() const override
+        {
+            return "T3=T1*T2";
+        }
+        shared_ptr<TF> clone() const override
+        {
+            return make_shared<Mul<Author>>(*this);
+        }
+        int run(shared_ptr<MemBase> mem, string &error) override
+        {
+            Precision a_type = mem->gettensor(this->args[0].textvalue).get()->shape.dtype;
+            Precision b_type = mem->gettensor(this->args[1].textvalue).get()->shape.dtype;
+            Precision c_type = mem->gettensor(this->returns[0].textvalue).get()->shape.dtype;
+            if (a_type != b_type || a_type != c_type)
+            {
+                error = "Type mismatch: " + precision_str(a_type) + " != " + precision_str(b_type) + " != " + precision_str(c_type);
+                return 1;
+            }
+            switch (a_type)
+            {
+            case Precision::Float64:
+                tensorfunc::mul<Author, double>(*mem->gettensor<double>(this->args[0].textvalue), *mem->gettensor<double>(this->args[1].textvalue), *mem->gettensor<double>(this->returns[0].textvalue));
+                break;
+            case Precision::Float32:
+                tensorfunc::mul<Author, float>(*mem->gettensor<float>(this->args[0].textvalue), *mem->gettensor<float>(this->args[1].textvalue), *mem->gettensor<float>(this->returns[0].textvalue));
+                break;
+            case Precision::Int64:
+                tensorfunc::mul<Author, int64_t>(*mem->gettensor<int64_t>(this->args[0].textvalue), *mem->gettensor<int64_t>(this->args[1].textvalue), *mem->gettensor<int64_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int32:
+                tensorfunc::mul<Author, int32_t>(*mem->gettensor<int32_t>(this->args[0].textvalue), *mem->gettensor<int32_t>(this->args[1].textvalue), *mem->gettensor<int32_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int16:
+                tensorfunc::mul<Author, int16_t>(*mem->gettensor<int16_t>(this->args[0].textvalue), *mem->gettensor<int16_t>(this->args[1].textvalue), *mem->gettensor<int16_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int8:
+                tensorfunc::mul<Author, int8_t>(*mem->gettensor<int8_t>(this->args[0].textvalue), *mem->gettensor<int8_t>(this->args[1].textvalue), *mem->gettensor<int8_t>(this->returns[0].textvalue));
+                break;
+            default:
+                error = "Unsupported dtype: " + precision_str(a_type);
+                return 1;
+            }
+            return 0;
+        }
+    };
+
+    template <typename Author>
+    class MulScalar : public TF
+    {
+    public:
+        MulScalar(vector<Param> args, vector<Param> returns)
+        {
+            this->name = "mulscalar";
+            this->author = Author::name();
+            this->args = args;
+            this->returns = returns;
+        }
+        string math_formula() const override
+        {
+            return "T3=T1*scalar";
+        }
+        shared_ptr<TF> clone() const override
+        {
+            return make_shared<MulScalar<Author>>(*this);
+        }
+        int run(shared_ptr<MemBase> mem, string &error) override
+        {
+            Precision a_type = mem->gettensor(this->args[0].textvalue).get()->shape.dtype;
+            Precision c_type = mem->gettensor(this->returns[0].textvalue).get()->shape.dtype;
+            if (a_type != c_type)
+            {
+                error = "Type mismatch: " + precision_str(a_type) + " != " + precision_str(c_type);
+                return 1;
+            }
+            switch (a_type)
+            {
+            case Precision::Float64:
+                tensorfunc::mulscalar<Author, double>(*mem->gettensor<double>(this->args[0].textvalue), this->getvar<double>(1, mem), *mem->gettensor<double>(this->returns[0].textvalue));
+                break;
+            case Precision::Float32:
+                tensorfunc::mulscalar<Author, float>(*mem->gettensor<float>(this->args[0].textvalue), this->getvar<float>(1, mem), *mem->gettensor<float>(this->returns[0].textvalue));
+                break;
+            case Precision::Int64:
+                tensorfunc::mulscalar<Author, int64_t>(*mem->gettensor<int64_t>(this->args[0].textvalue), this->getvar<int64_t>(1, mem), *mem->gettensor<int64_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int32:
+                tensorfunc::mulscalar<Author, int32_t>(*mem->gettensor<int32_t>(this->args[0].textvalue), this->getvar<int32_t>(1, mem), *mem->gettensor<int32_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int16:
+                tensorfunc::mulscalar<Author, int16_t>(*mem->gettensor<int16_t>(this->args[0].textvalue), this->getvar<int16_t>(1, mem), *mem->gettensor<int16_t>(this->returns[0].textvalue));
+                break;
+            case Precision::Int8:
+                tensorfunc::mulscalar<Author, int8_t>(*mem->gettensor<int8_t>(this->args[0].textvalue), this->getvar<int8_t>(1, mem), *mem->gettensor<int8_t>(this->returns[0].textvalue));
+                break;
+            default:
+                error = "Unsupported dtype: " + precision_str(a_type);
+                return 1;
+            }
+            return 0;
+        }
+    };
 }
 
 #endif

From 640d3cf5950b811a1720e8520eac4308b2dc6cb1 Mon Sep 17 00:00:00 2001
From: miaobyte <734991033@qq.com>
Date: Wed, 26 Mar 2025 18:20:00 +0800
Subject: [PATCH 3/5] front: newtensor/print joint debugging
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 front/py/deepx/nn/deepxir.py          | 40 +++++++++++++++++++--------
 front/py/deepx/nn/functional/new.py   |  4 +--
 front/py/deepx/nn/functional/print.py |  4 +--
 3 files changed, 33 insertions(+), 15 deletions(-)

diff --git a/front/py/deepx/nn/deepxir.py b/front/py/deepx/nn/deepxir.py
index 6dce38ea..988afdc2 100644
--- a/front/py/deepx/nn/deepxir.py
+++ b/front/py/deepx/nn/deepxir.py
@@ -1,14 +1,36 @@
-from typing import Tuple, List, Optional
+from typing import Tuple, List, Optional,Union
 import time
 from datetime import datetime  # add the datetime module
 
+class Param:
+    def __init__(self, value:Optional[Union[str,int,float,list,tuple]], category:str=None,precision:str=None):
+        if isinstance(value,str):
+            self._textvalue=value
+        elif isinstance(value,int) or isinstance(value,float):
+            self._textvalue=str(value)
+        elif isinstance(value,list) or isinstance(value,tuple):
+            self._textvalue='['+' '.join(str(v) for v in value)+']'
+        else:
+            raise ValueError(f"Invalid value type: {type(value)}")
+
+        self._category=category
+        self._precision=precision
+
+    def __str__(self):
+        if self._category is not None:
+            if self._precision is not None:
+                return f"{self._category}<{self._precision}> {self._textvalue}"
+            else:
+                return f"{self._category} {self._textvalue}"
+        else:
+            return self._textvalue
+
 class DeepxIR:
     def __init__(self,
                 name:str,
-                dtype:str,
-                args: List[str],
-                returns: List[str],
-                author:str):
+                args: List[Param],
+                returns: List[Param],
+                author:str=''):
         """
         Initialize an op node
         Args:
@@ -17,8 +39,7 @@ def __init__(self,
             author: author name of the tensorfunc, e.g. "miaobyte"
         """
-        self._name = name
-        self._dtype = dtype
+        self._name = name
         self._args = args
         self._returns = returns
         self._author = author
@@ -28,10 +49,7 @@ def __init__(self,
 
     def __str__(self):
         # function-name part
-        if self._dtype == None or self._dtype == '':
-            parts = [self._name]
-        else:
-            parts = [f"{self._name}@{self._dtype}"]
+        parts = [self._name]
 
         # input-args part: wrapped in parentheses, comma-separated
         args_parts = []

diff --git a/front/py/deepx/nn/functional/new.py b/front/py/deepx/nn/functional/new.py
index 879eda7d..1cc14dff 100644
--- a/front/py/deepx/nn/functional/new.py
+++ b/front/py/deepx/nn/functional/new.py
@@ -1,6 +1,6 @@
 from deepx.tensor import Tensor
 from deepx.autograd.graph import Graph
-from deepx.nn.deepxir import DeepxIR
+from deepx.nn.deepxir import DeepxIR,Param
 from deepx.scheduler import send
 
 def newtensor(t:Tensor,name:str=None):
@@ -8,7 +8,7 @@ def newtensor(t:Tensor,name:str=None):
     t._graph = graph
     t._node=graph.add_tensor(name,t=t)
     if t.graph.eager:
-        ir2=DeepxIR("newtensor", t.dtype, t.shape, [t._node.name])
+        ir2=DeepxIR("newtensor",[Param(t.shape)], [Param(t._node.name,category='tensor',precision=t.dtype)])
         send(ir2)
 def copytensor(t:Tensor,out:Tensor):
     graph = Graph.get_default()

diff --git a/front/py/deepx/nn/functional/print.py b/front/py/deepx/nn/functional/print.py
index b4c11fb6..2eb2bb25 100644
--- a/front/py/deepx/nn/functional/print.py
+++ b/front/py/deepx/nn/functional/print.py
@@ -4,8 +4,8 @@
 from deepx.scheduler import send
 
 OpNode.register("print")
-def printtensor(t:Tensor,format=''):
-    ir=DeepxIR("print",'', [t.node.name,format], [])
+def printtensor(t:Tensor,format='',author='miaobyte'):
+    ir=DeepxIR("print",[t.node.name,format], [],author)
     send(ir)
     return ''

From 73bc7ba905da6451fdfe3127102d739ca85e050c Mon Sep 17 00:00:00 2001
From: harryharrygo
Date: Thu, 20 Mar 2025 22:47:55 +0800
Subject: [PATCH 4/5] Fix build error in gcc compiler.
 (#5)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

In the gcc/g++ 13 compiler, the build fails with:

```
dtype.hpp:8:29: error: found ':' in nested-name-specifier, expected '::'
    8 | enum class DataCategory : uint8_t
```

---
 excuter/cpp-common/src/deepx/dtype.hpp | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/excuter/cpp-common/src/deepx/dtype.hpp b/excuter/cpp-common/src/deepx/dtype.hpp
index 9b9e24e8..b93a2a7a 100644
--- a/excuter/cpp-common/src/deepx/dtype.hpp
+++ b/excuter/cpp-common/src/deepx/dtype.hpp
@@ -2,6 +2,8 @@
 #define DEEPX_DTYPE_HPP
 
 #include <string>
+#include <cstdint>
+
 namespace deepx
 {

From a1f68151502e5477692f0c9542956abb659bbff6 Mon Sep 17 00:00:00 2001
From: miaobyte <734991033@qq.com>
Date: Wed, 26 Mar 2025 18:54:09 +0800
Subject: [PATCH 5/5] front&excuter: joint debugging; fix the IR for init and
 elementwise
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 front/py/deepx/nn/functional/elementwise.py   |  26 +--
 front/py/deepx/nn/functional/init.py          |  14 +-
 front/py/examples/2_ir/1_init_zeroones.dot    |  76 ++++-----
 .../py/examples/2_ir/1_init_zeroones.dot.svg  | 152 +++++++++---------
 4 files changed, 134 insertions(+), 134 deletions(-)

diff --git a/front/py/deepx/nn/functional/elementwise.py b/front/py/deepx/nn/functional/elementwise.py
index cd12979c..ecf3c0c3 100644
--- a/front/py/deepx/nn/functional/elementwise.py
+++ b/front/py/deepx/nn/functional/elementwise.py
@@ -1,13 +1,13 @@
 from typing import Optional, Union
 from deepx import Tensor
 from deepx.autograd import Graph,DataNode,OpNode
-from deepx.nn import DeepxIR
+from deepx.nn import DeepxIR,Param
 from deepx.scheduler import send
 from .changeshape import broadcast_shape
 
 def _A_elementwiseop_C(
     a:Tensor,
     op:str=None,
-    out:Union[Tensor,str]="")->Tensor:
+    out:Union[Tensor,str]="",author='miaobyte')->Tensor:
     g=a.graph
     opnode = g.add_op(op)
@@ -20,7 +20,7 @@ def _A_elementwiseop_C(
         outtensor=out
     outtensor.node.add_input(opnode)
     if g.eager:
-        ir=DeepxIR(op, a.dtype, [a.node.name], [outtensor.node.name])
+        ir=DeepxIR(op, [a.node.name], [outtensor.node.name],author)
         send(ir)
     return outtensor
 
@@ -28,7 +28,7 @@ def _A_B_elementwiseop_C(
     a:Tensor,
     b: Tensor,
     op:str=None,
-    out:Union[Tensor,str]="")->Tensor:
+    out:Union[Tensor,str]="",author='miaobyte')->Tensor:
     g=a.graph
     if g is None:
         g=b.graph
@@ -53,14 +53,14 @@ def _A_B_elementwiseop_C(
         outtensor=out
     outtensor.node.add_input(opnode)
     if g.eager:
-        ir=DeepxIR(op, A.dtype, [A.node.name, B.node.name], [outtensor.node.name])
+        ir=DeepxIR(op, [A.node.name, B.node.name], [outtensor.node.name],author)
         send(ir)
     return outtensor
 def _A_b_elementwiseop_C(
     a:Tensor,
     b: Union[ float, int] ,
     op:str=None,
-    out:Union[Tensor,str]="")->Tensor:
+    out:Union[Tensor,str]="",author='miaobyte')->Tensor:
     g=a.graph
     opnode = g.add_op(op)
     opnode.add_input(a.node)
@@ -74,14 +74,14 @@ def _A_b_elementwiseop_C(
         outtensor=out
     outtensor.node.add_input(opnode)
     if g.eager:
-        ir=DeepxIR(op, a.dtype, [a.node.name,b], [outtensor.node.name])
+        ir=DeepxIR(op, [a.node.name,b], [outtensor.node.name],author)
         send(ir)
     return outtensor
 def _a_B_elementwiseop_C(
     a: Union[ float, int] ,
     b: Tensor,
     op:str=None,
-    out:Union[Tensor,str]="")->Tensor:
+    out:Union[Tensor,str]="",author='miaobyte')->Tensor:
     g=b.graph
     opnode = g.add_op(op)
     opnode.add_input(g.add_var("",a))
@@ -95,7 +95,7 @@ def _a_B_elementwiseop_C(
         outtensor=out
     outtensor.node.add_input(opnode)
     if g.eager:
-        ir=DeepxIR(op, b.dtype, [a,b.node.name], [outtensor.node.name])
+        ir=DeepxIR(op, [a,b.node.name], [outtensor.node.name],author)
         send(ir)
     return outtensor
 
@@ -106,7 +106,7 @@ def _a_B_elementwiseop_C(
 def add(
     a:Tensor,
     b: Optional[Union[Tensor, float, int]] = None,
-    out:Union[Tensor,str]='')->Tensor:
+    out:Union[Tensor,str]='',author='miaobyte')->Tensor:
     if isinstance(b,Tensor):
         return _A_B_elementwiseop_C(a,b,"add",out)
     else:
@@ -120,7 +120,7 @@ def add(
 def sub(
     a:Tensor,
     b: Optional[Union[Tensor, float, int]] = None,
-    out:Union[Tensor,str]='')->Tensor:
+    out:Union[Tensor,str]='',author='miaobyte')->Tensor:
     if isinstance(b,Tensor):
         return _A_B_elementwiseop_C(a,b,"sub",out)
     else:
@@ -133,7 +133,7 @@ def sub(
 def mul(
     a:Tensor,
     b: Optional[Union[Tensor, float, int]] = None,
-    out:Union[Tensor,str]='')->Tensor:
+    out:Union[Tensor,str]='',author='miaobyte')->Tensor:
     if isinstance(b,Tensor):
         return _A_B_elementwiseop_C(a,b,"mul",out)
     else:
@@ -147,7 +147,7 @@ def mul(
 def div(
     a: Optional[Union[Tensor, float, int]] = None,
     b: Optional[Union[Tensor, float, int]] = None,
-    out:Union[Tensor,str]='')->Tensor:
+    out:Union[Tensor,str]='',author='miaobyte')->Tensor:
     if isinstance(b,Tensor) and isinstance(a,Tensor):
         return _A_B_elementwiseop_C(a,b,"div",out)
     else:

diff --git a/front/py/deepx/nn/functional/init.py b/front/py/deepx/nn/functional/init.py
index 182e696d..bb5b8f40 100644
--- a/front/py/deepx/nn/functional/init.py
+++ b/front/py/deepx/nn/functional/init.py
@@ -3,19 +3,19 @@
 
 from deepx import Tensor
 from deepx.autograd.graph import OpNode
-from deepx.nn.deepxir import DeepxIR
+from deepx.nn.deepxir import DeepxIR,Param
 from deepx.scheduler import send
 
 OpNode.register("constant")
 def constant(t:Tensor,
              value:Optional[Union[
-                 float,int]]=None) -> Tensor:
+                 float,int]]=None,author='miaobyte') -> Tensor:
     opnode = t.graph.add_op("constant")
     argnode=t.graph.add_var('',value)
     opnode.add_input(argnode)
     t.node.add_input(opnode)
     if t.graph.eager:
-        ir=DeepxIR("constant", t.dtype, [value], [t.node.name])
+        ir=DeepxIR("constant", [Param(t.node.name, 'tensor', t.dtype),Param(value)], [],author)
         send(ir)
     return t
 
@@ -36,7 +36,7 @@
 def ones(*size, dtype=None, device=None, name:Union[str]='')->Tensor:
     return full(*size, value=1, dtype=dtype, device=device,name=name)
 
-def arange(start=0, end=None, step=1,dtype=None, device=None,name:Union[Tensor,str]='')->Tensor:
+def arange(start=0, end=None, step=1,dtype=None, device=None,name:Union[Tensor,str]='',author='miaobyte')->Tensor:
     outtensor=None
     if isinstance(name,str):
         shape=[end-start]
@@ -49,12 +49,12 @@ def arange(start=0, end=None, step=1,dtype=None, device=None,name:Union[Tensor,s
         outtensor=name
     g=outtensor.graph
     if g.eager:
-        ir=DeepxIR("arange", outtensor.dtype, [start,step], [outtensor.node.name])
+        ir=DeepxIR("arange", [outtensor.node.name,start,step], [],author)
         send(ir)
     return outtensor
 
 OpNode.register("uniform")
-def uniform(t:Tensor,low=0, high=1,seed:int=0)->Tensor:
+def uniform(t:Tensor,low=0, high=1,seed:int=0,author='miaobyte')->Tensor:
     if low >= high:
         raise ValueError(f"low({low}) must be less than high({high})")
     if t is None:
@@ -68,7 +68,7 @@ def uniform(t:Tensor,low=0, high=1,seed:int=0)->Tensor:
     opnode.add_input(g.add_var('',seed))
     t.node.add_input(opnode)
     if t.graph.eager:
-        ir=DeepxIR("uniform", t.dtype, [low, high,seed], [t.node.name])
+        ir=DeepxIR("uniform", [t.node.name,low, high,seed], [],author)
         send(ir)
     return t

diff --git a/front/py/examples/2_ir/1_init_zeroones.dot b/front/py/examples/2_ir/1_init_zeroones.dot
index a78b90cc..33d54af8 100644
--- a/front/py/examples/2_ir/1_init_zeroones.dot
+++ b/front/py/examples/2_ir/1_init_zeroones.dot
@@ -2,55 +2,55 @@ digraph {
     rankdir=TB
     node [shape=record]
-    134462353640752 [label="t1
+    132815942520016 [label="t1
 (3, 4, 5)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460378946608 [label=constant color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-    134460378946848 [label="var_1
+    132813646230768 [label=constant color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+    132814271881056 [label="var_1
 0" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377149792 [label="t2
+    132813645298272 [label="t2
 (3, 4, 5)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377149936 [label=constant color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-    134460377150032 [label="var_2
+    132813645298464 [label=constant color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+    132813645298080 [label="var_2
 1" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377150272 [label=add color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-    134460377150464 [label="t3
+    132813645298704 [label=add color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+    132813645298512 [label="t3
 (3, 4, 5)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377150560 [label="t4
+    132813645298800 [label="t4
 (3, 4, 5)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377150800 [label=constant color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-    134460377150752 [label="var_3
+    132813645299136 [label=constant color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+    132813645299088 [label="var_3
 0.5" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377150896 [label=add color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-    134460377151040 [label="t5
+    132813645298944 [label=add color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+    132813645299424 [label="t5
 (3, 4, 5)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377151472 [label="tensor_6
+    132813645299664 [label="tensor_6
 (3, 4, 5)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377151568 [label=constant color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-    134460377151520 [label="var_4
+    132813645293616 [label=constant color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+    132813645293664 [label="var_4
 0" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377151712 [label=uniform color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-    134460377151232 [label="var_5
+    132813645293280 [label=uniform color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+    132813645299616 [label="var_5
 -0.5477225575051661" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377151904 [label="var_6
+    132813645293568 [label="var_6
 0.5477225575051661" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460377151856 [label="var_7
+    132813645293424 [label="var_7
 0" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-    134460378946608 -> 134462353640752 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460378946848 -> 134460378946608 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377149936 -> 134460377149792 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377150032 -> 134460377149936 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134462353640752 -> 134460377150272 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377149792 -> 134460377150272 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377150272 -> 134460377150464 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377150800 -> 134460377150560 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377150752 -> 134460377150800 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377150560 -> 134460377150896 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377150464 -> 134460377150896 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377150896 -> 134460377151040 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377151568 -> 134460377151472 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377151712 -> 134460377151472 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377151520 -> 134460377151568 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377151232 -> 134460377151712 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377151904 -> 134460377151712 [arrowsize=0.8 color=gray40 penwidth=1.2]
-    134460377151856 -> 134460377151712 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813646230768 -> 132815942520016 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132814271881056 -> 132813646230768 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645298464 -> 132813645298272 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645298080 -> 132813645298464 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132815942520016 -> 132813645298704 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645298272 -> 132813645298704 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645298704 -> 132813645298512 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645299136 -> 132813645298800 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645299088 -> 132813645299136 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645298800 -> 132813645298944 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645298512 -> 132813645298944 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645298944 -> 132813645299424 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645293616 -> 132813645299664 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645293280 -> 132813645299664 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645293664 -> 132813645293616 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645299616 -> 132813645293280 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645293568 -> 132813645293280 [arrowsize=0.8 color=gray40 penwidth=1.2]
+    132813645293424 -> 132813645293280 [arrowsize=0.8 color=gray40 penwidth=1.2]
 }

diff --git a/front/py/examples/2_ir/1_init_zeroones.dot.svg b/front/py/examples/2_ir/1_init_zeroones.dot.svg
index ffd2506d..474bbbd8 100644
--- a/front/py/examples/2_ir/1_init_zeroones.dot.svg
+++ b/front/py/examples/2_ir/1_init_zeroones.dot.svg
@@ -9,244 +9,244 @@
 [SVG hunk not reproduced: this file is the rendered Graphviz image of 1_init_zeroones.dot, and its XML markup did not survive extraction. The hunk mirrors the .dot diff above: only the generated node IDs change (e.g. 134462353640752 -> 132815942520016), while the graph structure and the labels (t1..t5, tensor_6, var_1..var_7, and the constant/add/uniform op nodes) stay the same.]
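[Reviewer note on patches 3 and 5] The front-end change that ties this series together is the new `Param` serialization in deepxir.py: every IR argument is now rendered as `category<precision> textvalue` (or just the text value for plain vars and shapes). The snippet below is a standalone copy of `Param` from the patch for a quick sanity check; how `DeepxIR.__str__` assembles the full instruction line is only partially visible in the diff, so that part is deliberately not reproduced here.

```python
from typing import Optional, Union

# Standalone copy of Param from front/py/deepx/nn/deepxir.py (patch 3),
# lightly reformatted; behavior is unchanged.
class Param:
    def __init__(self, value: Optional[Union[str, int, float, list, tuple]],
                 category: str = None, precision: str = None):
        if isinstance(value, str):
            self._textvalue = value
        elif isinstance(value, (int, float)):
            self._textvalue = str(value)
        elif isinstance(value, (list, tuple)):
            # shapes serialize as space-separated values in brackets
            self._textvalue = '[' + ' '.join(str(v) for v in value) + ']'
        else:
            raise ValueError(f"Invalid value type: {type(value)}")
        self._category = category
        self._precision = precision

    def __str__(self):
        if self._category is not None:
            if self._precision is not None:
                return f"{self._category}<{self._precision}> {self._textvalue}"
            return f"{self._category} {self._textvalue}"
        return self._textvalue

print(Param([3, 4, 5]))                                     # -> [3 4 5]
print(Param("t3", category="tensor", precision="float32"))  # -> tensor<float32> t3
print(Param(0.5, category="var"))                           # -> var 0.5
```

These rendered arguments line up with the executor-side function definitions in the list.md tables, e.g. `subscalar(tensor a, var scalar)->(tensor c)`, which is what the `SubScalar` tf classes added in patch 1 parse and dispatch on.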