diff --git a/doc/excuter/op-mem-ompsimd/list.md b/doc/excuter/op-mem-ompsimd/list.md
index f018d192..c9d51f4f 100644
--- a/doc/excuter/op-mem-ompsimd/list.md
+++ b/doc/excuter/op-mem-ompsimd/list.md
@@ -4,6 +4,7 @@
 
 | Operation | Author | Func Def | Math Formula | IR Instruction |
 |-----------|--------|------------|--------------|----------------|
+| reducemax | miaobyte | reducemax(tensor<any> A, vector<int32> axis, var<bool> keepdims)->(tensor<any> B) | B = reducemax(A, axis=[1 2], keepdims=false) | reducemax(tensor<any> A, vector<int32> axis, var<bool> keepdims)->(tensor<any> B) |
 | broadcastTo | miaobyte | broadcastTo(tensor<any> A, vector<int32> new_shape)->(tensor<any> B) | T2 = T1.broadcastTo(new_shape=[4,3,2]) | broadcastTo(tensor<any> A, vector<int32> new_shape)->(tensor<any> B) |
 | concat | miaobyte | concat(listtensor<any> tensors, var<int32> axis)->(tensor<any> result) | Tresult = concat([T1, T2...], axis=3) | concat(listtensor<any> tensors, var<int32> axis)->(tensor<any> result) |
 | transpose | miaobyte | transpose(tensor<any> A, vector<int32> dim_order)->(tensor<any> C) | T1.transpose(dimorder=[1,0])->T2 | transpose(tensor<any> A, vector<int32> dim_order)->(tensor<any> C) |
@@ -21,8 +22,10 @@
 | newtensor |  none  | newtensor(vector<int32> shape)->(tensor<any> tensor1) | T1 =Tensor(shape=[...]) | newtensor(vector<int32> shape)->(tensor<any> tensor1) |
 | newtensor |  none  | newtensor(var<string> shape)->(tensor<any> tensor1) | T1 =Tensor(shape=[...]) | newtensor(var<string> shape)->(tensor<any> tensor1) |
 | vecset |  none  | vecset(vector<any> value)->(vector<any> name) | shape = [3  4  5] | vecset(vector<any> value)->(vector<any> name) |
+| reducemin | miaobyte | reducemin(tensor<any> A, vector<int32> axis, var<bool> keepdims)->(tensor<any> B) | B = reducemin(A, axis=[1 2], keepdims=false) | reducemin(tensor<any> A, vector<int32> axis, var<bool> keepdims)->(tensor<any> B) |
 | subscalar | miaobyte | subscalar(tensor<any> a, var<any> scalar)->(tensor<any> c) | T3=T1-scalar | subscalar(tensor<any> a, var<any> scalar)->(tensor<any> c) |
 | sqrt | miaobyte | sqrt(tensor<any> A)->(tensor<any> C) | T3=sqrt(T1) | sqrt(tensor<any> A)->(tensor<any> C) |
+| sum | miaobyte | sum(tensor<any> A, vector<int32> axis, var<bool> keepdims)->(tensor<any> B) | B = sum(A, axis=[1 2], keepdims=false) | sum(tensor<any> A, vector<int32> axis, var<bool> keepdims)->(tensor<any> B) |
 | argset |  none  | argset(var<any> value)->(var<any> name) | var argname = argvalue | argset(var<any> value)->(var<any> name) |
 | sub | miaobyte | sub(tensor<any> a, tensor<any> b)->(tensor<any> c) | T3=T1-T2 | sub(tensor<any> a, tensor<any> b)->(tensor<any> c) |
 | mulscalar | miaobyte | mulscalar(tensor<any> A, var<any> b)->(tensor<any> C) | T3=T1*scalar | mulscalar(tensor<any> A, var<any> b)->(tensor<any> C) |
@@ -36,6 +39,7 @@
 | exp | miaobyte | exp(tensor<any> A)->(tensor<any> C) | T3=exp(T1) | exp(tensor<any> A)->(tensor<any> C) |
 | rdivscalar | miaobyte | rdivscalar(var<any> scalar, tensor<any> A)->(tensor<any> C) | T3=scalar/T1 | rdivscalar(var<any> scalar, tensor<any> A)->(tensor<any> C) |
 | minscalar | miaobyte | minscalar(tensor<any> A, var<any> scalar)->(tensor<any> C) | T3=min(T1,scalar) | minscalar(tensor<any> A, var<any> scalar)->(tensor<any> C) |
+| prod | miaobyte | prod(tensor<any> A, vector<int32> axis, var<bool> keepdims)->(tensor<any> B) | B = prod(A, axis=[1 2], keepdims=false) | prod(tensor<any> A, vector<int32> axis, var<bool> keepdims)->(tensor<any> B) |
 | min | miaobyte | min(tensor<any> A, tensor<any> B)->(tensor<any> C) | T3=min(T1,T2) | min(tensor<any> A, tensor<any> B)->(tensor<any> C) |
 | compare | miaobyte | compare(tensor<any> A, tensor<any> B)->(tensor<float32> mask) | mask=compare(T1,T2) | compare(tensor<any> A, tensor<any> B)->(tensor<float32> mask) |
 | matmul | cblas | matmul(tensor<float64|float32> A, tensor<float64|float32> B)->(tensor<float64|float32> C) | T3=T1 @ T2 | matmul(tensor<float64|float32> A, tensor<float64|float32> B)->(tensor<float64|float32> C) |
diff --git a/excuter/cpp-common/src/deepx/shape_broadcast.hpp b/excuter/cpp-common/src/deepx/shape_broadcast.hpp
deleted file mode 100644
index 290eb632..00000000
--- a/excuter/cpp-common/src/deepx/shape_broadcast.hpp
+++ /dev/null
@@ -1,21 +0,0 @@
-#ifndef DEEPX_OP_CPU_SHAPE_HPP
-#define DEEPX_OP_CPU_SHAPE_HPP
-
-
-#include "deepx/tensor.hpp"
-
-
-namespace deepx  {
-    
-    std::vector<int> broadcastShape(const std::vector<int> &a, const std::vector<int> &b);
-    enum BroadcastMap
-    {
-        xTox = 0,
-        nullTo1 = 1,
-        xTo1 = 2,
-    };
-    std::vector<BroadcastMap> broadcastMap(const std::vector<int> &a, const std::vector<int> &b);
-
-}
-
-#endif // DEEPX_OP_CPU_SHAPE_HPP
\ No newline at end of file
diff --git a/excuter/cpp-common/src/deepx/shape_broadcast.cpp b/excuter/cpp-common/src/deepx/shape_changeshape.cpp
similarity index 54%
rename from excuter/cpp-common/src/deepx/shape_broadcast.cpp
rename to excuter/cpp-common/src/deepx/shape_changeshape.cpp
index 75ee5575..17a89461 100644
--- a/excuter/cpp-common/src/deepx/shape_broadcast.cpp
+++ b/excuter/cpp-common/src/deepx/shape_changeshape.cpp
@@ -1,11 +1,92 @@
 #include <vector>
 #include <stdexcept>
 
-#include "deepx/shape_broadcast.hpp"
+#include "deepx/shape_changeshape.hpp"
 
 namespace deepx 
 {
-   
+    // transpose
+
+    // Returns the identity axis order [0, 1, ..., rank-1] for `shape` with its
+    // last two entries swapped. Only the rank of `shape` is used, not its extents.
+    // Throws std::invalid_argument when `shape` has fewer than two dimensions,
+    // since size() - 2 would otherwise wrap around and index out of bounds.
+    std::vector<int> swaplastTwoDimOrder(const std::vector<int> &shape)
+    {
+        if (shape.size() < 2)
+        {
+            throw std::invalid_argument("swaplastTwoDimOrder requires at least two dimensions.");
+        }
+        std::vector<int> dimOrder(shape.size());
+        std::iota(dimOrder.begin(), dimOrder.end(), 0);
+        std::swap(dimOrder[dimOrder.size() - 1], dimOrder[dimOrder.size() - 2]);
+        return dimOrder;
+    }
+
+    // Returns `shape` permuted by `dimOrder`, i.e. result[i] = shape[dimOrder[i]].
+    // Throws std::invalid_argument when the two sizes differ or when an entry of
+    // `dimOrder` is not a valid axis index into `shape`.
+    std::vector<int> transposeShape(const std::vector<int> &shape, const std::vector<int> &dimOrder)
+    {
+        if (dimOrder.size() != shape.size())
+        {
+            throw std::invalid_argument("dimOrder size does not match the number of dimensions in the TensorCPU.");
+        }
+        std::vector<int> newShape(shape.size());
+        for (size_t i = 0; i < dimOrder.size(); ++i)
+        {
+            const int axis = dimOrder[i];
+            // Reject bad axes up front instead of reading outside `shape`.
+            if (axis < 0 || static_cast<size_t>(axis) >= shape.size())
+            {
+                throw std::invalid_argument("dimOrder contains an axis that is out of range.");
+            }
+            newShape[i] = shape[axis];
+        }
+        return newShape;
+    }
+
+    // concat
+
+    // Returns the shape obtained by concatenating `shapes` along `axis`: the
+    // extents on `axis` are summed and every other extent must be identical.
+    // Throws std::invalid_argument when `shapes` is empty, when `axis` is not in
+    // [0, rank), when the ranks differ, or when an off-axis extent differs.
+    Shape concatShape(const std::vector<Shape> &shapes, const int axis)
+    {
+        if (shapes.empty())
+        {
+            throw std::invalid_argument("concatShape requires at least one shape.");
+        }
+        std::vector<int> outputShape(shapes[0].dim);
+        outputShape = shapes[0].shape;
+        if (axis < 0 || static_cast<size_t>(axis) >= outputShape.size())
+        {
+            throw std::invalid_argument("Concatenation axis is out of range.");
+        }
+        const size_t concatAxis = static_cast<size_t>(axis);
+        for (size_t i = 1; i < shapes.size(); ++i)
+        {
+            if (static_cast<size_t>(shapes[i].dim) != outputShape.size())
+            {
+                throw std::invalid_argument("All tensors must have the same number of dimensions.");
+            }
+            for (size_t j = 0; j < outputShape.size(); ++j)
+            {
+                if (j == concatAxis)
+                {
+                    outputShape[j] += shapes[i].shape[j];
+                }
+                else if (shapes[i].shape[j] != outputShape[j])
+                {
+                    throw std::invalid_argument("Shapes of tensors must match except in the concatenation axis.");
+                }
+            }
+        }
+        return Shape(outputShape);
+    }
+
+    // broadcast
     std::vector<int> broadcastShape(const std::vector<int> &a, const std::vector<int> &b)
     {
         int len1 = a.size();
diff --git a/excuter/cpp-common/src/deepx/shape_changeshape.hpp b/excuter/cpp-common/src/deepx/shape_changeshape.hpp
new file mode 100644
index 00000000..291c7291
--- /dev/null
+++ b/excuter/cpp-common/src/deepx/shape_changeshape.hpp
@@ -0,0 +1,76 @@
+#ifndef DEEPX_SHAPE_CHANGESHAPE_HPP
+#define DEEPX_SHAPE_CHANGESHAPE_HPP
+
+#include <vector>
+#include <numeric>
+#include <algorithm>
+#include <stdexcept>
+#include "deepx/tensor.hpp"
+#include "deepx/shape.hpp"
+#include "stdutil/error.hpp"
+
+namespace deepx
+{
+    // transpose
+
+    using namespace std;
+    std::vector<int> swaplastTwoDimOrder(const std::vector<int> &shape);
+
+    std::vector<int> transposeShape(const std::vector<int> &shape, const std::vector<int> &dimOrder);
+
+    // concat
+
+    Shape concatShape(const std::vector<Shape> &shapes, const int axis);
+    // Gathers the Shape of every tensor in `tensors`, in order, and forwards to the Shape-based concatShape overload.
+    template <typename T>
+    Shape concatShape(const std::vector<Tensor<T> *> &tensors, const int axis)
+    {
+        std::vector<Shape> collected;
+        for (Tensor<T> *tensor : tensors)
+        {
+            collected.push_back(tensor->shape);
+        }
+        return concatShape(collected, axis);
+    }
+    // Returns whether the inputs' extents on `axis` sum to output's extent there; throws TensorShapeError on a rank or off-axis mismatch.
+    template <typename T>
+    bool checkShapeConcat(const std::vector<Tensor<T> *> &tensors, const int axis, const Tensor<T> &output)
+    {
+        int extentAlongAxis = 0; // running sum of the inputs' sizes on `axis`
+        for (int t = 0; t < tensors.size(); t++)
+        {
+            Tensor<T> *input = tensors[t];
+            // Rank must agree before any per-axis comparison is made.
+            if (input->shape.dim != output.shape.dim)
+            {
+                throw TensorShapeError("All input tensors must have the same dimension size for concat");
+            }
+            for (int d = 0; d < input->shape.dim; d++)
+            {
+                if (d == axis)
+                {
+                    extentAlongAxis += input->shape[d];
+                    continue;
+                }
+                if (input->shape[d] != output.shape[d])
+                {
+                    throw TensorShapeError("All input tensors must have the same dimension size for concat");
+                }
+            }
+        }
+        return extentAlongAxis == output.shape[axis];
+    }
+
+    // broadcast
+    std::vector<int> broadcastShape(const std::vector<int> &a, const std::vector<int> &b);
+    enum BroadcastMap
+    {
+        xTox = 0,
+        nullTo1 = 1,
+        xTo1 = 2,
+    };
+    std::vector<BroadcastMap> broadcastMap(const std::vector<int> &a, const std::vector<int> &b);
+
+}
+
+#endif // DEEPX_SHAPE_CHANGESHAPE_HPP
\ No newline at end of file
diff --git a/excuter/cpp-common/src/deepx/shape_concat.cpp b/excuter/cpp-common/src/deepx/shape_concat.cpp
deleted file mode 100644
index 597ba5b2..00000000
--- a/excuter/cpp-common/src/deepx/shape_concat.cpp
+++ /dev/null
@@ -1,30 +0,0 @@
-#include <stdexcept>
-#include <vector>
-#include "deepx/shape_concat.hpp"
-
-namespace deepx
-{
-    Shape concatShape(const std::vector<Shape> &shapes,const int axis){
-        std::vector<int> outputShape(shapes[0].dim);
-        outputShape=shapes[0].shape;
-        for (int i = 1; i < shapes.size(); ++i)
-        {
-            if (shapes[i].dim != outputShape.size())
-            {
-                throw std::invalid_argument("All tensors must have the same number of dimensions.");
-            }
-            for (size_t j = 0; j < outputShape.size(); ++j)
-            {
-                if (j == axis)
-                {
-                    outputShape[j] += shapes[i].shape[j];
-                }
-                else if (shapes[i].shape[j] != outputShape[j])
-                {
-                    throw std::invalid_argument("Shapes of tensors must match except in the concatenation axis.");
-                }
-            }
-        }
-        return Shape(outputShape);
-    }
-}
\ No newline at end of file
diff --git a/excuter/cpp-common/src/deepx/shape_concat.hpp b/excuter/cpp-common/src/deepx/shape_concat.hpp
deleted file mode 100644
index 91884e5e..00000000
--- a/excuter/cpp-common/src/deepx/shape_concat.hpp
+++ /dev/null
@@ -1,50 +0,0 @@
-#ifndef DEEPX_SHAPE_CONCAT_HPP
-#define DEEPX_SHAPE_CONCAT_HPP
-
-#include "deepx/shape.hpp"
-#include "deepx/tensor.hpp"
-#include "stdutil/error.hpp"
-
-namespace deepx
-{
-
-    Shape concatShape(const std::vector<Shape> &shapes,const int axis);
-
-    template<typename T>
-    Shape concatShape(const std::vector<Tensor<T>*> &tensors,const int axis){
-        std::vector<Shape> shapes;
-        for (int i = 0; i < tensors.size(); ++i)
-        {
-            shapes.push_back(tensors[i]->shape);
-        }
-        return concatShape(shapes,axis);
-    }
-
-    template<typename T>
-    bool checkShapeConcat(const std::vector<Tensor<T>*> &tensors,const int axis,const Tensor<T> &output){
-        int axisDim=0;
-        for (int i = 0; i < tensors.size(); i++)
-        {
-            if (tensors[i]->shape.dim != output.shape.dim)
-            {
-                throw TensorShapeError("All input tensors must have the same dimension size for concat");
-            }
-            for (int j = 0; j < tensors[i]->shape.dim; j++)
-            {
-                if (j != axis)
-                {   
-                    if (tensors[i]->shape[j] != output.shape[j])
-                    {
-                        throw TensorShapeError("All input tensors must have the same dimension size for concat");
-                    }
-                }
-                else
-                {
-                    axisDim += tensors[i]->shape[j];
-                }
-            }
-        }
-        return axisDim == output.shape[axis];
-    }
-};
-#endif // DEEPX_SHAPE_CONCAT_HPP
\ No newline at end of file
diff --git a/excuter/cpp-common/src/deepx/shape_reduce.cpp b/excuter/cpp-common/src/deepx/shape_reduce.cpp
index 0a64eb65..2f017a9b 100644
--- a/excuter/cpp-common/src/deepx/shape_reduce.cpp
+++ b/excuter/cpp-common/src/deepx/shape_reduce.cpp
@@ -3,60 +3,65 @@
 #include <algorithm>
 #include <stdexcept>
 
+#include "stdutil/error.hpp"
 #include "deepx/shape_reduce.hpp"
 
 namespace deepx
 {
-  std::vector<int> reduceDimMap(const Shape &shape, const std::vector<int> &dims)
+    std::vector<int> checkedDims(const std::vector<int> &inputshape, const std::vector<int> &dims)
     {
-        // Step 1: 确定输出形状
-        std::vector<int> sumDims;
+        std::vector<int> checkeddims;
+        // An empty dims means "reduce every axis": emit 0..rank-1
         if (dims.empty())
         {
-            for (int i = 0; i < shape.dim; ++i)
+            for (int i = 0; i < inputshape.size(); ++i)
             {
-                sumDims.push_back(i);
+                checkeddims.push_back(i);
             }
         }
         else
-        {
-            sumDims = std::vector<int>(dims.data(), dims.data() + dims.size());
-        }
-        std::sort(sumDims.begin(), sumDims.end());
-        // 去重
-        sumDims.erase(std::unique(sumDims.begin(), sumDims.end()), sumDims.end());
-
-        // 验证维度
-        for (int d : sumDims)
-        {
-            if (d < 0 || d >= shape.dim)
+        {   
+            // Validate each axis: negative values count from the end; anything still outside [0, rank) throws
+            for (int d : dims)
             {
-                throw std::invalid_argument("Dimension out of range in sum");
+                if (d < 0)
+                {
+                    d = inputshape.size() + d;
+                }
+                if (d >= inputshape.size())
+                {
+                    throw TensorShapeError("Dimension out of range in sum");
+                }
+                checkeddims.push_back(d);
             }
         }
 
-        // 创建一个映射数组，标记哪些维度需要求和
-        std::vector<int> sumMap(shape.dim, 0);
-        for (int dim : sumDims)
-        {
-            sumMap[dim] = 1;
-        }
-        return sumMap;
+        // Sort ascending
+        std::sort(checkeddims.begin(), checkeddims.end());
+        // Drop duplicates (std::unique relies on the sorted order above)
+        checkeddims.erase(std::unique(checkeddims.begin(), checkeddims.end()), checkeddims.end());
+
+        return checkeddims;
     }
-    std::vector<int> reduceShape(const Shape &a, const std::vector<int> &dims)
+
+    std::vector<int> reducedShape(const std::vector<int> &inputshape, const std::vector<int> &dims, const bool keepdim)
     {
-        
+
         // 创建一个映射数组，标记哪些维度需要求和
-        std::vector<int> reduceMap = reduceDimMap(a, dims);
+        std::vector<int> reducedims = reducedDim(inputshape, dims);
 
         // 计算输出形状
         std::vector<int> outputShape;
 
-        for (size_t i = 0; i < a.dim; ++i)
+        for (size_t i = 0; i < inputshape.size(); ++i)
         {
-            if (reduceMap[i] == 0)
+            if (reducedims[i] == 0)
+            {
+                outputShape.push_back(inputshape[i]);
+            }
+            else if (keepdim)
             {
-                outputShape.push_back(a[i]);
+                outputShape.push_back(1);
             }
         }
 
@@ -66,5 +71,26 @@ namespace deepx
             outputShape.push_back(1);
         }
         return outputShape;
-    }   
+    }
+
+    // Builds a 0/1 mask with one entry per axis of `shape`: entry i is 1 when
+    // axis i is listed in `dims` and 0 otherwise. Negative entries of `dims`
+    // count from the last axis, matching checkedDims.
+    // Throws std::invalid_argument when an entry does not name an axis of
+    // `shape`, instead of writing outside the mask.
+    std::vector<int> reducedDim(const std::vector<int> &shape, const std::vector<int> &dims)
+    {
+        const int rank = static_cast<int>(shape.size());
+        std::vector<int> sumMap(shape.size(), 0);
+        for (int dim : dims)
+        {
+            const int axis = dim < 0 ? dim + rank : dim;
+            if (axis < 0 || axis >= rank)
+            {
+                throw std::invalid_argument("Dimension out of range in reduce");
+            }
+            sumMap[axis] = 1;
+        }
+        return sumMap;
+    }
 }
\ No newline at end of file
diff --git a/excuter/cpp-common/src/deepx/shape_reduce.hpp b/excuter/cpp-common/src/deepx/shape_reduce.hpp
index 54093ebb..ac15d4e7 100644
--- a/excuter/cpp-common/src/deepx/shape_reduce.hpp
+++ b/excuter/cpp-common/src/deepx/shape_reduce.hpp
@@ -5,8 +5,15 @@
 
 namespace deepx
 {
-        std::vector<int> reduceDimMap(const Shape &shape, const std::vector<int> &dims);
-        std::vector<int> reduceShape(const Shape &a, const std::vector<int> &dims);
+
+        // Validates dims against inputshape and returns them normalized (negative axes wrapped, sorted, de-duplicated); empty dims selects every axis.
+        std::vector<int> checkedDims(const std::vector<int> &inputshape, const std::vector<int> &dims);
+
+        // Returns the shape left after reducing over dims; reduced axes are dropped, or kept with size 1 when keepdim is true.
+        std::vector<int> reducedShape(const std::vector<int> &inputshape, const std::vector<int> &dims, const bool keepdim = false);
+
+        // Returns a 0/1 mask with one entry per axis of inputshape: 1 marks an axis listed in dims.
+        std::vector<int> reducedDim(const std::vector<int> &inputshape, const std::vector<int> &dims );
 }
 
 #endif // DEEPX_SHAPE_SUM_HPP
\ No newline at end of file
diff --git a/excuter/cpp-common/src/deepx/shape_transpose.hpp b/excuter/cpp-common/src/deepx/shape_transpose.hpp
deleted file mode 100644
index c41c7875..00000000
--- a/excuter/cpp-common/src/deepx/shape_transpose.hpp
+++ /dev/null
@@ -1,34 +0,0 @@
-#ifndef DEEPX_SHAPE_TRANSPOSE_HPP
-#define DEEPX_SHAPE_TRANSPOSE_HPP
-
-#include <vector>
-#include <numeric>
-#include <algorithm>
-#include <stdexcept>
-#include "deepx/shape.hpp"
-
-namespace deepx
-{
-    using namespace std;
-    std::vector<int> swaplastTwoDimOrder(const std::vector<int> &shape)
-    {
-        vector<int> dimOrder = shape;
-        std::iota(dimOrder.begin(), dimOrder.end(), 0);
-        swap(dimOrder[dimOrder.size() - 1], dimOrder[dimOrder.size() - 2]);
-        return dimOrder;
-    }
-    std::vector<int> transposeShape(const std::vector<int> &shape, const std::vector<int> &dimOrder)
-    {
-        if (dimOrder.size() != shape.size())
-        {
-            throw std::invalid_argument("dimOrder size does not match the number of dimensions in the TensorCPU.");
-        }
-        std::vector<int> newShape = shape;
-        for (size_t i = 0; i < dimOrder.size(); ++i)
-        {
-            newShape[i] =shape[dimOrder[i]];
-        }
-        return newShape;
-    }
-}
-#endif // DEEPX_SHAPE_TRANSPOSE_HPP
diff --git a/excuter/cpp-common/src/deepx/tf/tf.hpp b/excuter/cpp-common/src/deepx/tf/tf.hpp
index f5b17204..4329fb47 100644
--- a/excuter/cpp-common/src/deepx/tf/tf.hpp
+++ b/excuter/cpp-common/src/deepx/tf/tf.hpp
@@ -25,9 +25,11 @@ namespace deepx::tf
     {
         TypeDef dtype;
         string textvalue;
-        any value;
+ 
         Param(const string &textvalue = "", const DataCategory &dt = DataCategory::Unknown, const Precision &prec = Precision::Any)
             : textvalue(textvalue), dtype(make_dtype(dt, prec)) {}
+
+        
     };
 
     // TF:Tensor Function的缩写
@@ -75,6 +77,29 @@ namespace deepx::tf
             {
                 throw std::invalid_argument("Invalid argument index");
             }
+            // 处理布尔类型
+            if constexpr (std::is_same<T, bool>::value)
+            {
+                const string &value = vars[idx].textvalue;
+                // 转换为小写再判断
+                string lower_value = value;
+                std::transform(lower_value.begin(), lower_value.end(), lower_value.begin(),
+                               [](unsigned char c)
+                               { return std::tolower(c); });
+
+                if (lower_value == "true")
+                {
+                    return true;
+                }
+                else if (lower_value == "false")
+                {
+                    return false;
+                }
+                else
+                {
+                    throw std::invalid_argument("Invalid bool value:" + value);
+                }
+            }
             if (is_float(vars[idx].textvalue))
             {
                 T value = T(std::stof(vars[idx].textvalue));
@@ -83,10 +108,8 @@ namespace deepx::tf
             return mem->getarg<T>(vars[idx].textvalue);
         }
 
-        
-
         template <typename T>
-        vector<T> getvector(int idx,bool arg = true)
+        vector<T> getvector(int idx, bool arg = true)
         {
             vector<Param> &vars = arg ? args : returns;
             if (idx < 0)
diff --git a/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cu b/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cu
index 92940d90..ac395c3f 100644
--- a/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cu
+++ b/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cu
@@ -7,7 +7,7 @@
 #include "deepx/tensorfunc/authors.hpp"
 #include "deepx/tensorfunc/tensor_cuda.cuh"
 #include "deepx/tensorfunc/vector_cuda.cuh"
-#include "deepx/shape_broadcast.hpp"
+#include "deepx/shape_changeshape.hpp"
 
 namespace deepx::tensorfunc
 {
diff --git a/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cuh b/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cuh
index e44874ea..f9f47f7b 100644
--- a/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cuh
+++ b/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.cuh
@@ -4,7 +4,7 @@
 #include <cuda_bf16.h>
 #include <cuda_fp16.h>
 
-#include "deepx/shape_broadcast.hpp"
+#include "deepx/shape_changeshape.hpp"
 #include "deepx/tensorfunc/cuda.hpp"
 #include "deepx/tensorfunc/authors.hpp"
 
diff --git a/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.hpp b/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.hpp
index 1faf58e7..6f76fa23 100644
--- a/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.hpp
+++ b/excuter/op-mem-cuda/src/deepx/tensorfunc/changeshape_miaobyte.hpp
@@ -8,8 +8,7 @@
 #include "deepx/tensorfunc/authors.hpp"
 #include "deepx/tensorfunc/changeshape_miaobyte.cuh"
 #include "deepx/tensorfunc/cuda.hpp"
-#include "deepx/shape_concat.hpp"
-#include "deepx/shape_broadcast.hpp"
+#include "deepx/shape_changeshape.hpp"
 #include "stdutil/error.hpp"
 namespace deepx::tensorfunc
 {
diff --git a/excuter/op-mem-ompsimd/src/client/tfs.cpp b/excuter/op-mem-ompsimd/src/client/tfs.cpp
index d81306ee..2c675170 100644
--- a/excuter/op-mem-ompsimd/src/client/tfs.cpp
+++ b/excuter/op-mem-ompsimd/src/client/tfs.cpp
@@ -7,6 +7,7 @@
 #include "deepx/tf/io.hpp"
 #include "deepx/tf/changeshape.hpp"
 #include "deepx/tf/elementwise.hpp"
+#include "deepx/tf/reduce.hpp"
 #include "deepx/tf/tffactory.hpp"
 #include "deepx/tf/matmul.hpp"
 #include "deepx/tensorfunc/authors.hpp"
@@ -17,6 +18,7 @@ namespace deepx::tf
     // tensor
     void register_lifecycle(TfFactory &tffactory)
     {
+        // argset author=miaobyte
         tffactory.add_tf(std::make_shared<ArgSet>(vector<Param>(
                                                       {
                                                           Param("value", DataCategory::Var, Precision::Any),
@@ -25,6 +27,7 @@ namespace deepx::tf
                                                       {
                                                           Param("name", DataCategory::Var, Precision::Any),
                                                       })));
+        // vecset author=miaobyte
         tffactory.add_tf(std::make_shared<VecSet>(
             vector<Param>(
                 {
@@ -34,6 +37,7 @@ namespace deepx::tf
                 {
                     Param("name", DataCategory::Vector, Precision::Any),
                 })));
+        // newtensor author=miaobyte
         tffactory.add_tf(std::make_shared<NewTensor>(vector<Param>(
                                                          {
                                                              Param("shape", DataCategory::Vector, Precision::Int32),
@@ -42,6 +46,7 @@ namespace deepx::tf
                                                          {
                                                              Param("tensor1", DataCategory::Tensor, Precision::Any),
                                                          })));
+        // newtensor author=miaobyte
         tffactory.add_tf(std::make_shared<NewTensor>(vector<Param>(
                                                          {
                                                              Param("shape", DataCategory::Var, Precision::String),
@@ -50,22 +55,19 @@ namespace deepx::tf
                                                          {
                                                              Param("tensor1", DataCategory::Tensor, Precision::Any),
                                                          })));
-        // opfactory.add_op(DelTensor<float>());
     }
 
     // init
     void register_init(TfFactory &tffactory)
     {
-        //     opfactory.add_op(Uniform<float>());
-        //     opfactory.add_op(Uniform<double>());
-
+        // constant author=miaobyte
         tffactory.add_tf(std::make_shared<Constant<miaobyte>>(vector<Param>(
                                                                   {
                                                                       Param("t", DataCategory::Tensor, Precision::Any),
                                                                       Param("value", DataCategory::Var, Precision::Any),
                                                                   }),
                                                               vector<Param>()));
-
+        // arange author=miaobyte
         tffactory.add_tf(std::make_shared<Arange<miaobyte>>(vector<Param>(
                                                                 {
                                                                     Param("t", DataCategory::Tensor, Precision::Any),
@@ -73,6 +75,7 @@ namespace deepx::tf
                                                                     Param("step", DataCategory::Var, Precision::Any),
                                                                 }),
                                                             vector<Param>()));
+        // uniform author=miaobyte
         tffactory.add_tf(std::make_shared<Uniform<miaobyte>>(vector<Param>(
                                                                  {
                                                                      Param("t", DataCategory::Tensor, Precision::Any),
@@ -85,12 +88,13 @@ namespace deepx::tf
     // io
     void register_util(TfFactory &opfactory)
     {
+        // print author=miaobyte
         opfactory.add_tf(std::make_shared<Print<miaobyte>>(vector<Param>(
                                                                {
                                                                    Param("", DataCategory::Tensor, Precision::Any),
                                                                }),
                                                            vector<Param>()));
-
+        // print author=miaobyte
         opfactory.add_tf(std::make_shared<Print<miaobyte>>(vector<Param>(
                                                                {
                                                                    Param("", DataCategory::Tensor, Precision::Any),
@@ -111,7 +115,7 @@ namespace deepx::tf
                                                              {
                                                                  Param("c", DataCategory::Tensor, Precision::Any),
                                                              })));
-
+        // add author=cblas
         tffactory.add_tf(std::make_shared<Add<cblas>>(vector<Param>(
                                                           {
                                                               Param("a", DataCategory::Tensor, Precision::Float64 | Precision::Float32),
@@ -122,6 +126,7 @@ namespace deepx::tf
                                                               Param("c", DataCategory::Tensor, Precision::Float64 | Precision::Float32),
                                                           })));
 
+        // add scalar author=miaobyte
         tffactory.add_tf(std::make_shared<AddScalar<miaobyte>>(vector<Param>(
                                                                    {
                                                                        Param("a", DataCategory::Tensor, Precision::Any),
@@ -131,6 +136,7 @@ namespace deepx::tf
                                                                    {
                                                                        Param("c", DataCategory::Tensor, Precision::Any),
                                                                    })));
+        // sub author=miaobyte
         tffactory.add_tf(std::make_shared<Sub<miaobyte>>(vector<Param>(
                                                              {
                                                                  Param("a", DataCategory::Tensor, Precision::Any),
@@ -140,7 +146,7 @@ namespace deepx::tf
                                                              {
                                                                  Param("c", DataCategory::Tensor, Precision::Any),
                                                              })));
-
+        // sub scalar author=miaobyte
         tffactory.add_tf(std::make_shared<SubScalar<miaobyte>>(vector<Param>(
                                                                    {
                                                                        Param("a", DataCategory::Tensor, Precision::Any),
@@ -150,7 +156,7 @@ namespace deepx::tf
                                                                    {
                                                                        Param("c", DataCategory::Tensor, Precision::Any),
                                                                    })));
-
+        // mul author=miaobyte
         tffactory.add_tf(std::make_shared<Mul<miaobyte>>(vector<Param>(
                                                              {
                                                                  Param("A", DataCategory::Tensor, Precision::Any),
@@ -160,6 +166,7 @@ namespace deepx::tf
                                                              {
                                                                  Param("C", DataCategory::Tensor, Precision::Any),
                                                              })));
+        // mul scalar author=miaobyte
         tffactory.add_tf(std::make_shared<MulScalar<miaobyte>>(vector<Param>(
                                                                    {
                                                                        Param("A", DataCategory::Tensor, Precision::Any),
@@ -179,6 +186,7 @@ namespace deepx::tf
                                                              {
                                                                  Param("C", DataCategory::Tensor, Precision::Any),
                                                              })));
+        // div scalar author=miaobyte
         tffactory.add_tf(std::make_shared<DivScalar<miaobyte>>(vector<Param>(
                                                                    {
                                                                        Param("A", DataCategory::Tensor, Precision::Any),
@@ -198,6 +206,7 @@ namespace deepx::tf
                                                                     {
                                                                         Param("C", DataCategory::Tensor, Precision::Any),
                                                                     })));
+        // sqrt author=miaobyte
         tffactory.add_tf(std::make_shared<Sqrt<miaobyte>>(vector<Param>(
                                                               {
                                                                   Param("A", DataCategory::Tensor, Precision::Any),
@@ -207,6 +216,7 @@ namespace deepx::tf
                                                                   Param("C", DataCategory::Tensor, Precision::Any),
                                                               })));
 
+        // pow author=miaobyte
         tffactory.add_tf(std::make_shared<Pow<miaobyte>>(vector<Param>(
                                                              {
                                                                  Param("A", DataCategory::Tensor, Precision::Any),
@@ -216,6 +226,7 @@ namespace deepx::tf
                                                              {
                                                                  Param("C", DataCategory::Tensor, Precision::Any),
                                                              })));
+        // pow scalar author=miaobyte
         tffactory.add_tf(std::make_shared<PowScalar<miaobyte>>(vector<Param>(
                                                                    {
                                                                        Param("A", DataCategory::Tensor, Precision::Any),
@@ -225,6 +236,7 @@ namespace deepx::tf
                                                                    {
                                                                        Param("C", DataCategory::Tensor, Precision::Any),
                                                                    })));
+        // log author=miaobyte
         tffactory.add_tf(std::make_shared<Log<miaobyte>>(vector<Param>(
                                                              {
                                                                  Param("A", DataCategory::Tensor, Precision::Any),
@@ -233,6 +245,7 @@ namespace deepx::tf
                                                              {
                                                                  Param("C", DataCategory::Tensor, Precision::Any),
                                                              })));
+        // exp author=miaobyte
         tffactory.add_tf(std::make_shared<Exp<miaobyte>>(vector<Param>(
                                                              {
                                                                  Param("A", DataCategory::Tensor, Precision::Any),
@@ -241,6 +254,7 @@ namespace deepx::tf
                                                              {
                                                                  Param("C", DataCategory::Tensor, Precision::Any),
                                                              })));
+        // max author=miaobyte
         tffactory.add_tf(std::make_shared<Max<miaobyte>>(vector<Param>(
                                                              {
                                                                  Param("A", DataCategory::Tensor, Precision::Any),
@@ -250,6 +264,7 @@ namespace deepx::tf
                                                              {
                                                                  Param("C", DataCategory::Tensor, Precision::Any),
                                                              })));
+        // max scalar author=miaobyte
         tffactory.add_tf(std::make_shared<MaxScalar<miaobyte>>(vector<Param>(
                                                                    {
                                                                        Param("A", DataCategory::Tensor, Precision::Any),
@@ -259,6 +274,7 @@ namespace deepx::tf
                                                                    {
                                                                        Param("C", DataCategory::Tensor, Precision::Any),
                                                                    })));
+        // min author=miaobyte
         tffactory.add_tf(std::make_shared<Min<miaobyte>>(vector<Param>(
                                                              {
                                                                  Param("A", DataCategory::Tensor, Precision::Any),
@@ -268,6 +284,7 @@ namespace deepx::tf
                                                              {
                                                                  Param("C", DataCategory::Tensor, Precision::Any),
                                                              })));
+        // min scalar author=miaobyte
         tffactory.add_tf(std::make_shared<MinScalar<miaobyte>>(vector<Param>(
                                                                    {
                                                                        Param("A", DataCategory::Tensor, Precision::Any),
@@ -277,6 +294,7 @@ namespace deepx::tf
                                                                    {
                                                                        Param("C", DataCategory::Tensor, Precision::Any),
                                                                    })));
+        // compare author=miaobyte
         tffactory.add_tf(std::make_shared<Compare<miaobyte>>(vector<Param>(
                                                                  {
                                                                      Param("A", DataCategory::Tensor, Precision::Any),
@@ -287,6 +305,7 @@ namespace deepx::tf
                                                                  {
                                                                      Param("mask", DataCategory::Tensor, Precision::Float32),
                                                                  })));
+        // compare scalar author=miaobyte
         tffactory.add_tf(std::make_shared<CompareScalar<miaobyte>>(vector<Param>(
                                                                        {
                                                                            Param("A", DataCategory::Tensor, Precision::Any),
@@ -300,6 +319,7 @@ namespace deepx::tf
     // matmul
     void register_matmul(TfFactory &tffactory)
     {
+        // matmul author=miaobyte
         tffactory.add_tf(std::make_shared<MatMul<miaobyte>>(vector<Param>(
                                                                 {
                                                                     Param("A", DataCategory::Tensor, Precision::Any),
@@ -309,6 +329,7 @@ namespace deepx::tf
                                                                 {
                                                                     Param("C", DataCategory::Tensor, Precision::Any),
                                                                 })));
+        // matmul author=cblas
         tffactory.add_tf(std::make_shared<MatMul<cblas>>(vector<Param>(
                                                              {
                                                                  Param("A", DataCategory::Tensor, Precision::Float64 | Precision::Float32),
@@ -322,7 +343,7 @@ namespace deepx::tf
     // // changeshape
     void register_changeshape(TfFactory &tffactory)
     {
-        
+        // reshape author=miaobyte
         tffactory.add_tf(std::make_shared<Reshape<miaobyte>>(vector<Param>(
                                                                  {
                                                                      Param("A", DataCategory::Tensor, Precision::Any),
@@ -334,48 +355,84 @@ namespace deepx::tf
                                                                  })));
 
         tffactory.add_tf(std::make_shared<Transpose<miaobyte>>(vector<Param>(
-                {
-                    Param("A", DataCategory::Tensor, Precision::Any),
-                    Param("dim_order", DataCategory::Vector, Precision::Int32),
-                }),
-            vector<Param>(
-                {
-                    Param("C", DataCategory::Tensor, Precision::Any),
-                })));
-
+                                                                   {
+                                                                       Param("A", DataCategory::Tensor, Precision::Any),
+                                                                       Param("dim_order", DataCategory::Vector, Precision::Int32),
+                                                                   }),
+                                                               vector<Param>(
+                                                                   {
+                                                                       Param("C", DataCategory::Tensor, Precision::Any),
+                                                                   })));
+        // concat author=miaobyte
         tffactory.add_tf(std::make_shared<Concat<miaobyte>>(vector<Param>(
-                {
-                    Param("tensors", DataCategory::ListTensor, Precision::Any),
-                    Param("axis", DataCategory::Var, Precision::Int32),
-                }),
-            vector<Param>(
-                {
-                    Param("result", DataCategory::Tensor, Precision::Any),
-                })));
+                                                                {
+                                                                    Param("tensors", DataCategory::ListTensor, Precision::Any),
+                                                                    Param("axis", DataCategory::Var, Precision::Int32),
+                                                                }),
+                                                            vector<Param>(
+                                                                {
+                                                                    Param("result", DataCategory::Tensor, Precision::Any),
+                                                                })));
+        // broadcastto author=miaobyte
         tffactory.add_tf(std::make_shared<BroadcastTo<miaobyte>>(vector<Param>(
-                {
-                    Param("A", DataCategory::Tensor, Precision::Any),
-                    Param("new_shape", DataCategory::Vector, Precision::Int32),
-                }),
-            vector<Param>(
-                {
-                    Param("B", DataCategory::Tensor, Precision::Any),
-                })));
+                                                                     {
+                                                                         Param("A", DataCategory::Tensor, Precision::Any),
+                                                                         Param("new_shape", DataCategory::Vector, Precision::Int32),
+                                                                     }),
+                                                                 vector<Param>(
+                                                                     {
+                                                                         Param("B", DataCategory::Tensor, Precision::Any),
+                                                                     })));
     }
     // // reduce
-    // void register_reduce(OpFactory &opfactory)
-    // {
-    //     opfactory.add_op(Max<float>());
-    //     opfactory.add_op(Max<double>());
-    //     opfactory.add_op(Maxscalar<float>());
-    //     opfactory.add_op(Maxscalar<double>());
-    //     opfactory.add_op(Min<float>());
-    //     opfactory.add_op(Min<double>());
-    //     opfactory.add_op(Minscalar<float>());
-    //     opfactory.add_op(Minscalar<double>());
-    //     opfactory.add_op(Sum<float>());
-    //     opfactory.add_op(Sum<double>());
-    // }
+    void register_reduce(TfFactory &tffactory) // registers the miaobyte Sum, Prod, ReduceMax and ReduceMin ops on tffactory
+    {
+        // sum author=miaobyte; first Param list = arguments (A, axis, keepdims), second = returns (B)
+        tffactory.add_tf(std::make_shared<Sum<miaobyte>>(vector<Param>(
+                                                             {
+                                                                 Param("A", DataCategory::Tensor, Precision::Any),
+                                                                 Param("axis", DataCategory::Vector, Precision::Int32),
+                                                                 Param("keepdims", DataCategory::Var, Precision::Bool),
+                                                             }),
+                                                         vector<Param>(
+                                                             {
+                                                                 Param("B", DataCategory::Tensor, Precision::Any),
+                                                             })));
+        // prod author=miaobyte; same argument/return layout as sum
+        tffactory.add_tf(std::make_shared<Prod<miaobyte>>(vector<Param>(
+                                                              {
+                                                                  Param("A", DataCategory::Tensor, Precision::Any),
+                                                                  Param("axis", DataCategory::Vector, Precision::Int32),
+                                                                  Param("keepdims", DataCategory::Var, Precision::Bool),
+                                                              }),
+                                                          vector<Param>(
+                                                              {
+                                                                  Param("B", DataCategory::Tensor, Precision::Any),
+                                                                 })));
+        // reducemax author=miaobyte; same argument/return layout as sum
+        tffactory.add_tf(std::make_shared<ReduceMax<miaobyte>>(vector<Param>(
+                                                                 {
+                                                                     Param("A", DataCategory::Tensor, Precision::Any),
+                                                                     Param("axis", DataCategory::Vector, Precision::Int32),
+                                                                     Param("keepdims", DataCategory::Var, Precision::Bool),
+                                                                 }),
+                                                                 vector<Param>(
+                                                                     {
+                                                                         Param("B", DataCategory::Tensor, Precision::Any),
+                                                                     })));
+        // reducemin author=miaobyte; same argument/return layout as sum
+        tffactory.add_tf(std::make_shared<ReduceMin<miaobyte>>(vector<Param>(
+                                                                 {
+                                                                     Param("A", DataCategory::Tensor, Precision::Any),
+                                                                     Param("axis", DataCategory::Vector, Precision::Int32),
+                                                                     Param("keepdims", DataCategory::Var, Precision::Bool),
+                                                                 }),
+                                                                 vector<Param>(
+                                                                     {
+                                                                         Param("B", DataCategory::Tensor, Precision::Any),
+                                                                     })));
+    }
+ 
     int register_all(TfFactory &tffactory)
     {
         register_lifecycle(tffactory);
@@ -384,7 +441,7 @@ namespace deepx::tf
         register_elementwise(tffactory);
         register_matmul(tffactory);
         register_changeshape(tffactory);
-        // register_reduce(opfactory);
+        register_reduce(tffactory);
         return 0;
     }
 }
\ No newline at end of file
diff --git a/excuter/op-mem-ompsimd/src/deepx/tensorfunc/changeshape_miaobyte.hpp b/excuter/op-mem-ompsimd/src/deepx/tensorfunc/changeshape_miaobyte.hpp
index f62146ac..46f5a0b8 100644
--- a/excuter/op-mem-ompsimd/src/deepx/tensorfunc/changeshape_miaobyte.hpp
+++ b/excuter/op-mem-ompsimd/src/deepx/tensorfunc/changeshape_miaobyte.hpp
@@ -5,8 +5,7 @@
 #include <vector>
 
 #include "deepx/tensor.hpp"
-#include "deepx/shape_concat.hpp"
-#include "deepx/shape_broadcast.hpp"
+#include "deepx/shape_changeshape.hpp"
 #include "deepx/tensorfunc/new.hpp"
 #include "deepx/tensorfunc/changeshape.hpp"
 #include "deepx/tensorfunc/authors.hpp"
diff --git a/excuter/op-mem-ompsimd/src/deepx/tensorfunc/highway.hpp b/excuter/op-mem-ompsimd/src/deepx/tensorfunc/highway.hpp
new file mode 100644
index 00000000..ec18b89a
--- /dev/null
+++ b/excuter/op-mem-ompsimd/src/deepx/tensorfunc/highway.hpp
@@ -0,0 +1,23 @@
+#ifndef DEEPX_TENSORFUNC_HIGHWAY_HPP
+#define DEEPX_TENSORFUNC_HIGHWAY_HPP
+
+#include <hwy/highway.h>
+
+namespace deepx::tensorfunc
+{
+    using namespace hwy::HWY_NAMESPACE;
+
+    template <typename T, class D> // T is not deducible from the arguments, so callers spell it out: ReduceMul<T>(d, v)
+    T ReduceMul(D d, Vec<D> v) // horizontal product: multiplies the Lanes(d) lanes of v together and returns the scalar
+    {
+        T result = GetLane(v); // seed with the first lane
+        for (size_t i = 1; i < Lanes(d); ++i) // fold in the remaining lanes one at a time
+        {
+            result *= ExtractLane(v, i);
+        }
+        return result;
+    }
+
+}
+
+#endif
diff --git a/excuter/op-mem-ompsimd/src/deepx/tensorfunc/reduce_miaobyte.hpp b/excuter/op-mem-ompsimd/src/deepx/tensorfunc/reduce_miaobyte.hpp
index 3eb77628..9d7e37c8 100644
--- a/excuter/op-mem-ompsimd/src/deepx/tensorfunc/reduce_miaobyte.hpp
+++ b/excuter/op-mem-ompsimd/src/deepx/tensorfunc/reduce_miaobyte.hpp
@@ -4,10 +4,12 @@
 #include <vector>
 #include <algorithm>
 #include <stdexcept>
-#include <deepx/vector_combination.hpp>
 #include <hwy/highway.h>
 
+#include <deepx/vector_combination.hpp>
 #include "deepx/tensor.hpp"
+
+#include "deepx/tensorfunc/highway.hpp"
 #include "deepx/shape_reduce.hpp"
 #include "deepx/tensorfunc/reduce.hpp"
 #include "deepx/tensorfunc/init_miaobyte.hpp"
@@ -16,175 +18,332 @@ namespace deepx::tensorfunc
 {
     using namespace hwy::HWY_NAMESPACE;
 
+    // sum author=miaobyte: adds the elements of `tensor` into `result`, which is first filled with T(0)
     template <typename T>
     struct sumDispatcher<miaobyte, T>
     {
-        static void sum(const Tensor<T> &tensor, const std::vector<int> &dims, Tensor<T> &result,const bool keepdims)
+        static void sum(const Tensor<T> &tensor, const std::vector<int> &dims, Tensor<T> &result, const bool keepdims)
         {
             constant<miaobyte, T>(result, T(0));
-
-            std::vector<int> sorted_dims = dims;
-            if (dims.size() == 0)
+            std::vector<int> checkeddims = checkedDims(tensor.shape.shape, dims);
+            std::vector<int> reduced_dims = reducedDim(tensor.shape.shape, checkeddims); // indexed per input dimension below: 0 = index copied to the output, 1 = copied only with keepdims
+            const int minshape_1 = Lanes(ScalableTag<T>()); // number of T lanes in one SIMD vector
+            if (reduced_dims.rbegin()[0] == tensor.shape.dim - 1 || tensor.shape.dim > reduced_dims.size() || tensor.shape[-1] >= minshape_1) // NOTE(review): a last dimension of at least one vector takes this scalar path, so the SIMD branch only runs on rows shorter than a vector - confirm this is intended
             {
-                sorted_dims = arrange(tensor.shape.dim);
+                tensor.shape.rangeParallel(tensor.shape.dim, [&tensor, &result, &reduced_dims, keepdims](const int idx_linear, const std::vector<int> &indices, std::vector<int> &newIndices)
+                                           {
+                    // Compute the output index
+                    for (size_t i = 0, j = 0; i < tensor.shape.dim; ++i)
+                    {
+                        if (reduced_dims[i] == 0)
+                        {
+                            newIndices[j++] = indices[i];
+                        }else if (keepdims && (reduced_dims[i] == 1)) {
+                            newIndices[j++] = indices[i];
+                        }
+                    }
+                    int outputIdx = result.shape.linearat(newIndices);
+#pragma omp atomic
+                    result.data[outputIdx] += tensor.data[idx_linear]; }, result.shape.dim);
             }
-            // 从大到小排序
-            std::sort(sorted_dims.begin(), sorted_dims.end(), std::greater<int>());
-            std::vector<int> sumMap = reduceDimMap(tensor.shape, sorted_dims);
-            // 如果dims的最后一个元素是tensor.shape.dim-1，则说明求和的数据不连续（不对齐），无法simd（需要不停跳跃）
-
-            const ScalableTag<T> _tag;
-            size_t minshape_1 = Lanes(_tag);
-            // if (true)
-            if (sorted_dims.rbegin()[0] == tensor.shape.dim - 1 || tensor.shape.dim > sorted_dims.size() || tensor.shape[-1] >= minshape_1)
+            else
+            {
+                // If the data is contiguous (aligned), SIMD can be used
+                tensor.shape.rangeParallel(tensor.shape.dim - 1, [&tensor, &result, &reduced_dims, keepdims](const int idx_linear, const std::vector<int> &indices, std::vector<int> &newIndices)
+                                           {
+                    // Compute the output index
+                    for (size_t i = 0, j = 0; i < tensor.shape.dim; ++i)
+                    {
+                        if (reduced_dims[i] == 0)
+                        {
+                            newIndices[j++] = indices[i];
+                        }else if (keepdims && (reduced_dims[i] == 1)) {
+                            newIndices[j++] = indices[i];
+                        }
+                    }
+                    int outputIdx = result.shape.linearat(newIndices);
+                    int shape_last = tensor.shape[-1];
+                    const ScalableTag<T> tag;
+                    const size_t lanes = Lanes(tag);
+                    size_t j = 0;
+                    T sum = 0;
+                    // Head: add elements one by one until the address is vector-aligned
+                    while (j < shape_last && !IsAligned(tag, tensor.data + idx_linear + j))
+                    {
+                        sum += tensor.data[idx_linear + j];
+                        ++j;    
+                    }
+                    // Middle: SIMD
+                    size_t aligned_end = shape_last - (shape_last % lanes);
+                    auto sum_vec = Zero(tag);
+                    for (; j + lanes <= aligned_end; j += lanes)
+                    {
+                        auto vec = Load(tag, tensor.data + idx_linear + j);
+                        sum_vec = Add(sum_vec, vec);
+                    }
+                    // Fold the vector accumulator back into the scalar sum
+                    sum += ReduceSum(tag, sum_vec);
+                    // Tail: add the remaining elements
+                    for (; j < shape_last; ++j)
+                    {
+                        sum += tensor.data[idx_linear + j];
+                    }
+#pragma omp atomic
+                    result.data[outputIdx] += sum; }, result.shape.dim);
+            }
+        }
+    };
+
+    // prod author=miaobyte: multiplies the elements of `tensor` into `result`, which is first filled with T(1)
+    template <typename T>
+    struct prodDispatcher<miaobyte, T>
+    {
+        static void prod(const Tensor<T> &tensor, const std::vector<int> &dims, Tensor<T> &result, const bool keepdims)
+        {
+            std::vector<int> checkeddims = checkedDims(tensor.shape.shape, dims);
+            std::vector<int> reduced_dims = reducedDim(tensor.shape.shape, checkeddims); // indexed per input dimension below: 0 = index copied to the output, 1 = copied only with keepdims
+            const int minshape_1 = Lanes(ScalableTag<T>()); // number of T lanes in one SIMD vector
+            // If the last element of dims is tensor.shape.dim-1, the data reduced by prod is not contiguous (not aligned), so SIMD cannot be used (it would have to keep jumping)
+            constant<miaobyte,T>(result, T(1));
+            if (reduced_dims.rbegin()[0] == tensor.shape.dim - 1 || tensor.shape.dim > reduced_dims.size() || tensor.shape[-1] >= minshape_1) // NOTE(review): the else branch is therefore only reached when the last dimension is shorter than one vector - confirm this is intended
             {
-                tensor.shape.rangeParallel(tensor.shape.dim, [&tensor, &result, &sumMap](const int idx_linear, const std::vector<int> &indices, std::vector<int> &newIndices)
+                tensor.shape.rangeParallel(tensor.shape.dim, [&tensor, &result, &reduced_dims, keepdims](const int idx_linear, const std::vector<int> &indices, std::vector<int> &newIndices)
                                            {
                             // 计算输出索引
                          
                             for (size_t i = 0,j=0; i < tensor.shape.dim ; ++i) {
-                                if (sumMap[i]==0) {
+                                if (reduced_dims[i]==0) {
+                                        newIndices[j++]=indices[i];
+                                    }else if (keepdims && (reduced_dims[i] == 1)) {
                                         newIndices[j++]=indices[i];
                                     }
                                 }
                             // 累加求和
                             int outputIdx=result.shape.linearat(newIndices);
 #pragma omp atomic
-                            result.data[outputIdx]+=tensor.data[idx_linear]; }, result.shape.dim);
+                            result.data[outputIdx]*=tensor.data[idx_linear]; }, result.shape.dim);
             }
             else
             {
-                // 这里有bug，todo
-                //  如果数据连续（对齐），则可以simd
-                tensor.shape.rangeParallel(tensor.shape.dim - 1, [&tensor, &result, &sumMap](const int idx_linear, const std::vector<int> &indices, std::vector<int> &newIndices)
+                // If the data is contiguous (aligned), SIMD can be used
+                tensor.shape.rangeParallel(tensor.shape.dim - 1, [&tensor, &result, &reduced_dims, keepdims](const int idx_linear, const std::vector<int> &indices, std::vector<int> &newIndices)
                                            {
                                                // 计算输出索引
+
                                                for (size_t i = 0, j = 0; i < tensor.shape.dim; ++i)
                                                {
-                                                   if (sumMap[i] == 0)
+                                                   if (reduced_dims[i] == 0)
                                                    {
                                                        newIndices[j++] = indices[i];
+                                                   }else if (keepdims && (reduced_dims[i] == 1)) {
+                                                       newIndices[j++] = indices[i];
                                                    }
                                                }
+                                               // Output element that this row's product is multiplied into
                                                int outputIdx = result.shape.linearat(newIndices);
 
                                                int shape_last = tensor.shape[-1];
                                                const ScalableTag<T> tag;
                                                const size_t lanes = Lanes(tag);
                                                size_t j = 0;
-                                               T sum = 0;
+                                               T product = 1;
                                                // 前部分：处理到对齐
-                                               while (j < shape_last && !IsAligned(tag, tensor.data + idx_linear + j))
+                                               while (j < shape_last && !IsAligned(tag, tensor.data + idx_linear + j))
                                                {
-                                                   sum += tensor.data[idx_linear + j];
+                                                   product *= tensor.data[idx_linear + j];
                                                    ++j;
                                                }
 
                                                // 中间部分：SIMD
                                                size_t aligned_end = shape_last - (shape_last % lanes);
-                                               auto sum_vec = Zero(tag); // 初始化累加向量为0
+                                               // Seed with the multiplicative identity: an unconditional Load here read past rows shorter than one vector
+                                               auto product_vec = Set(tag, T(1));
                                                for (; j + lanes <= aligned_end; j += lanes)
                                                {
-                                                   auto vec = Load(tag, tensor.data + idx_linear + j);
-                                                   sum_vec = Add(sum_vec, vec); // 向量累加
+                                                   auto vec = Load(tag, tensor.data + idx_linear + j);
+                                                   product_vec = Mul(product_vec, vec); // lane-wise running product
                                                }
 
-                                               // 将向量累加结果写回
-                                               sum += ReduceSum(tag, sum_vec); // 使用ReduceSum替代GetLane(SumOfLane())
+                                               // Fold the vector product back into the scalar product
+                                               product *= ReduceMul<T>(tag,product_vec);
 
                                                // 尾部分：处理剩余
                                                for (; j < shape_last; ++j)
                                                {
-                                                   sum += tensor.data[idx_linear + j];
+                                                   product *= tensor.data[idx_linear + j];
                                                }
 #pragma omp atomic
-                                               result.data[outputIdx] += sum; }, result.shape.dim);
+                                               result.data[outputIdx] *= product; }, result.shape.dim);
             }
         }
     };
 
     template <typename T>
-    struct prodDispatcher<miaobyte, T>
+    struct reducemaxDispatcher<miaobyte, T>
     {
-        static void prod(const Tensor<T> &tensor, const std::vector<int> &dims, Tensor<T> &result,const bool keepdims)
+        static void reducemax(const Tensor<T> &tensor, const std::vector<int> &dims, Tensor<T> &result, const bool keepdims)
         {
-
-            std::vector<int> sorted_dims = dims;
-            if (dims.size() == 0)
+            std::vector<int> checkeddims = checkedDims(tensor.shape.shape, dims);
+            std::vector<int> reduced_dims = reducedDim(tensor.shape.shape, checkeddims);
+            const int minshape_1 = Lanes(ScalableTag<T>());
+            // 如果dims的最后一个元素是tensor.shape.dim-1，则说明reducemax的数据不连续（不对齐），无法simd（需要不停跳跃）
+            constant<miaobyte, T>(result, std::numeric_limits<T>::lowest());
+            if (reduced_dims.rbegin()[0] == tensor.shape.dim - 1 || tensor.shape.dim > reduced_dims.size() || tensor.shape[-1] >= minshape_1)
             {
-                sorted_dims = arrange(tensor.shape.dim);
+                tensor.shape.rangeParallel(tensor.shape.dim, [&tensor, &result, &reduced_dims, keepdims](const int idx_linear, const std::vector<int> &indices, std::vector<int> &newIndices)
+                                           {
+                            // 计算输出索引
+                         
+                            for (size_t i = 0,j=0; i < tensor.shape.dim ; ++i) {
+                                if (reduced_dims[i]==0) {
+                                        newIndices[j++]=indices[i];
+                                    }else if (keepdims && (reduced_dims[i] == 1)) {
+                                        newIndices[j++]=indices[i];
+                                    }
+                                }
+                            // 累加求和
+                            int outputIdx=result.shape.linearat(newIndices);
+                            result.data[outputIdx]=std::max(result.data[outputIdx],tensor.data[idx_linear]);
+                            }, result.shape.dim);
+            }
+            else
+            {
+                // 如果数据连续（对齐），则可以simd
+                tensor.shape.rangeParallel(tensor.shape.dim - 1, [&tensor, &result, &reduced_dims, keepdims](const int i, const std::vector<int> &indices, std::vector<int> &newIndices)
+                                           {
+                                               // 计算输出索引
+
+                                               for (size_t i = 0, j = 0; i < tensor.shape.dim; ++i)
+                                               {
+                                                   if (reduced_dims[i] == 0)
+                                                   {
+                                                       newIndices[j++] = indices[i];
+                                                   }else if (keepdims && (reduced_dims[i] == 1)) {
+                                                       newIndices[j++] = indices[i];
+                                                   }
+                                               }
+                                               
+                                               int outputIdx = result.shape.linearat(newIndices);
+
+                                               int shape_last = tensor.shape[-1];
+                                               const ScalableTag<T> tag;
+                                               const size_t lanes = Lanes(tag);
+                                               size_t j = 0;
+                                               T maxt = tensor.data[i];
+                                               // 前部分：处理到对齐
+                                               while (j < shape_last && !IsAligned(tag, tensor.data + i + j))
+                                               {
+                                                   maxt = std::max(maxt,tensor.data[i + j]);
+                                                   ++j;
+                                               }
+
+                                               // 中间部分：SIMD
+                                               size_t aligned_end = shape_last - (shape_last % lanes);
+                                               auto max_vec = Load(tag, tensor.data + i + j); // 初始化累乘向量为1
+                                               for (; j + lanes <= aligned_end; j += lanes)
+                                               {
+                                                   auto vec = Load(tag, tensor.data + i + j);
+                                                   max_vec = Max(max_vec, vec);  
+                                               }
+
+                                               // 将向量累乘结果写回
+                                               maxt = ReduceMax(tag, max_vec);
+
+                                               // 尾部分：处理剩余
+                                               for (; j < shape_last; ++j)
+                                               {
+                                                   maxt = std::max(maxt,tensor.data[i + j]);
+                                               }
+ 
+                                               result.data[outputIdx] = std::max(result.data[outputIdx],maxt);
+                                                }, result.shape.dim);
             }
-            // 从大到小排序
-            std::sort(sorted_dims.begin(), sorted_dims.end(), std::greater<int>());
-            std::vector<int> sumMap = reduceDimMap(tensor.shape, sorted_dims);
-            // 如果dims的最后一个元素是tensor.shape.dim-1，则说明求和的数据不连续（不对齐），无法simd（需要不停跳跃）
-            constant(result, T(1));
-            if (sorted_dims.at(sorted_dims.size() - 1) == tensor.shape.dim - 1 && tensor.shape.dim > sorted_dims.size())
+        }
+    };
+
+    template <typename T>
+    struct reduceminDispatcher<miaobyte, T> // miaobyte reducemin: folds tensor into result with std::min over the requested axes
+    {
+        static void reducemin(const Tensor<T> &tensor, const std::vector<int> &dims, Tensor<T> &result, const bool keepdims)
+        {
+            std::vector<int> checkeddims = checkedDims(tensor.shape.shape, dims);
+            std::vector<int> reduced_dims = reducedDim(tensor.shape.shape, checkeddims);
+            const int minshape_1 = Lanes(ScalableTag<T>()); // lanes per SIMD vector for T
+            // Choose between the per-element path and the SIMD row path. NOTE(review): reduced_dims is indexed below as a per-axis 0/1 flag, so comparing its last entry with dim - 1, and taking the per-element branch when the last axis is at least one vector wide, both look unintended - confirm the dispatch condition.
+            constant<miaobyte, T>(result, std::numeric_limits<T>::max()); // start every output at the identity of min
+            if (reduced_dims.rbegin()[0] == tensor.shape.dim - 1 || tensor.shape.dim > reduced_dims.size() || tensor.shape[-1] >= minshape_1)
             {
-                tensor.shape.rangeParallel(tensor.shape.dim, [&tensor, &result, &sumMap](const int idx_linear, const std::vector<int> &indices, std::vector<int> &newIndices)
+                tensor.shape.rangeParallel(tensor.shape.dim, [&tensor, &result, &reduced_dims, keepdims](const int idx_linear, const std::vector<int> &indices, std::vector<int> &newIndices)
                                            {
                             // 计算输出索引
                          
                             for (size_t i = 0,j=0; i < tensor.shape.dim ; ++i) {
-                                if (sumMap[i]==0) {
+                                if (reduced_dims[i]==0) {
+                                        newIndices[j++]=indices[i];
+                                    }else if (keepdims && (reduced_dims[i] == 1)) {
                                         newIndices[j++]=indices[i];
                                     }
                                 }
                             // 累加求和
                             int outputIdx=result.shape.linearat(newIndices);
-#pragma omp atomic
-                            result.data[outputIdx]*=tensor.data[idx_linear]; }, result.shape.dim);
+#pragma omp critical(deepx_reducemin)
+                            result.data[outputIdx]=std::min(result.data[outputIdx],tensor.data[idx_linear]); // several inputs fold into one output slot; a plain omp atomic cannot express std::min, hence the critical section
+                            }, result.shape.dim);
             }
             else
             {
                 // 如果数据连续（对齐），则可以simd
-                tensor.shape.rangeParallel(tensor.shape.dim - 1, [&tensor, &result, &sumMap](const int i, const std::vector<int> &indices, std::vector<int> &newIndices)
+                tensor.shape.rangeParallel(tensor.shape.dim - 1, [&tensor, &result, &reduced_dims, keepdims](const int i, const std::vector<int> &indices, std::vector<int> &newIndices)
                                            {
                                                // 计算输出索引
 
                                                for (size_t i = 0, j = 0; i < tensor.shape.dim; ++i)
                                                {
-                                                   if (sumMap[i] == 0)
+                                                   if (reduced_dims[i] == 0)
                                                    {
                                                        newIndices[j++] = indices[i];
+                                                   }else if (keepdims && (reduced_dims[i] == 1)) {
+                                                       newIndices[j++] = indices[i];
                                                    }
                                                }
-                                               // 累加求和
+                                               // Flat offset in result that this run of shape_last elements folds into.
                                                int outputIdx = result.shape.linearat(newIndices);
 
                                                int shape_last = tensor.shape[-1];
                                                const ScalableTag<T> tag;
                                                const size_t lanes = Lanes(tag);
                                                size_t j = 0;
-                                               T product = 1;
+                                               T mint = tensor.data[i]; // running minimum, seeded with the first element read
                                                // 前部分：处理到对齐
                                                while (j < shape_last && !IsAligned(tag, tensor.data + i + j))
                                                {
-                                                   product *= tensor.data[i + j];
+                                                   mint = std::min(mint,tensor.data[i + j]);
                                                    ++j;
                                                }
 
                                                // 中间部分：SIMD
                                                size_t aligned_end = shape_last - (shape_last % lanes);
-                                               auto product_vec = One(tag); // 初始化累乘向量为1
+                                               auto mint_vec = Set(tag, mint); // broadcast the head minimum: no load past the row, and the head result is carried through the vector
                                                for (; j + lanes <= aligned_end; j += lanes)
                                                {
                                                    auto vec = Load(tag, tensor.data + i + j);
-                                                   product_vec = Mul(product_vec, vec); // 向量累乘
+                                                   mint_vec = Min(mint_vec, vec);
                                                }
 
                                                // 将向量累乘结果写回
-                                               product *= ReduceMul(tag, product_vec);
+                                               mint = ReduceMin(tag, mint_vec); // lanes were seeded with the head minimum, so nothing found so far is lost
 
                                                // 尾部分：处理剩余
                                                for (; j < shape_last; ++j)
                                                {
-                                                   product *= tensor.data[i + j];
+                                                   mint = std::min(mint,tensor.data[i + j]);
                                                }
-#pragma omp atomic
-                                               result.data[outputIdx] *= product; }, result.shape.dim);
+#pragma omp critical(deepx_reducemin)
+                                               result.data[outputIdx] = std::min(result.data[outputIdx],mint); // guarded: other iterations may target the same output slot
+                                               }, result.shape.dim);
             }
         }
     };
+
 }
 #endif
\ No newline at end of file
diff --git a/excuter/op-mem-ompsimd/src/deepx/tf/reduce.hpp b/excuter/op-mem-ompsimd/src/deepx/tf/reduce.hpp
new file mode 100644
index 00000000..5e5a873b
--- /dev/null
+++ b/excuter/op-mem-ompsimd/src/deepx/tf/reduce.hpp
@@ -0,0 +1,246 @@
+#ifndef DEEPX_TF_REDUCE_HPP
+#define DEEPX_TF_REDUCE_HPP
+
+#include "deepx/tensor.hpp"
+#include "deepx/tensorfunc/reduce_miaobyte.hpp"
+#include <vector>
+#include "deepx/tf/tf.hpp"
+#include "deepx/dtype.hpp"
+
+namespace deepx::tf
+{
+    // TF node for the "sum" reduction. run() verifies that the input and output
+    // tensors share a dtype, then forwards to sum<Author, T> for that element type.
+    template <typename Author>
+    class Sum : public TF
+    {
+    public:
+        // Stores the op name, the author tag and the IR argument/return lists.
+        Sum(const vector<Param> &args, const vector<Param> &returns)
+        {
+            this->name = "sum";
+            this->author = Author::name();
+            this->args = args;
+            this->returns = returns;
+        }
+
+        // Example formula for this op.
+        string math_formula() const override { return "B = sum(A, axis=[1 2], keepdims=false)"; }
+
+        // Returns a copy of this node, args and returns included.
+        shared_ptr<TF> clone() const override { return make_shared<Sum>(*this); }
+
+        // Runs the reduction against the tensors registered in mem.
+        //   args[0]    name of the input tensor
+        //   arg 1      int vector handed to sum() as the axes to reduce
+        //   arg 2      bool handed to sum() as keepdims
+        //   returns[0] name of the output tensor
+        // Returns 0 on success; otherwise returns 1 and fills error with the
+        // reason (dtype mismatch or unsupported element type).
+        int run(shared_ptr<MemBase> mem, string &error) override
+        {
+            auto &src = this->args[0].textvalue;
+            const Precision input_type = mem->gettensor(src)->shape.dtype;
+            const vector<int> dims = this->getvector<int>(1, true);
+            const bool keepdims = this->getvar<bool>(2, mem, true);
+            auto &dst = this->returns[0].textvalue;
+            const Precision output_type = mem->gettensor(dst)->shape.dtype;
+            if (input_type != output_type)
+            {
+                error = "Type mismatch: " + precision_str(input_type) + " != " + precision_str(output_type);
+                return 1;
+            }
+
+            // One instantiation per supported element type.
+            switch (input_type)
+            {
+            case Precision::Float64: sum<Author, double>(*mem->gettensor<double>(src), dims, *mem->gettensor<double>(dst), keepdims); break;
+            case Precision::Float32: sum<Author, float>(*mem->gettensor<float>(src), dims, *mem->gettensor<float>(dst), keepdims); break;
+            case Precision::Int64: sum<Author, int64_t>(*mem->gettensor<int64_t>(src), dims, *mem->gettensor<int64_t>(dst), keepdims); break;
+            case Precision::Int32: sum<Author, int32_t>(*mem->gettensor<int32_t>(src), dims, *mem->gettensor<int32_t>(dst), keepdims); break;
+            case Precision::Int16: sum<Author, int16_t>(*mem->gettensor<int16_t>(src), dims, *mem->gettensor<int16_t>(dst), keepdims); break;
+            case Precision::Int8: sum<Author, int8_t>(*mem->gettensor<int8_t>(src), dims, *mem->gettensor<int8_t>(dst), keepdims); break;
+            default:
+                error = "Unsupported type: " + precision_str(input_type);
+                return 1;
+            }
+            return 0;
+        }
+    };
+
+    // TF node for the "prod" reduction. run() verifies that the input and output
+    // tensors share a dtype, then forwards to prod<Author, T> for that element type.
+    template <typename Author>
+    class Prod : public TF
+    {
+    public:
+        // Stores the op name, the author tag and the IR argument/return lists.
+        Prod(const vector<Param> &args, const vector<Param> &returns)
+        {
+            this->name = "prod";
+            this->author = Author::name();
+            this->args = args;
+            this->returns = returns;
+        }
+
+        // Example formula for this op.
+        string math_formula() const override { return "B = prod(A, axis=[1 2], keepdims=false)"; }
+
+        // Returns a copy of this node, args and returns included.
+        shared_ptr<TF> clone() const override { return make_shared<Prod>(*this); }
+
+        // Runs the reduction against the tensors registered in mem.
+        //   args[0]    name of the input tensor
+        //   arg 1      int vector handed to prod() as the axes to reduce
+        //   arg 2      bool handed to prod() as keepdims
+        //   returns[0] name of the output tensor
+        // Returns 0 on success; otherwise returns 1 and fills error.
+        int run(shared_ptr<MemBase> mem, string &error) override
+        {
+            auto &src = this->args[0].textvalue;
+            const Precision input_type = mem->gettensor(src)->shape.dtype;
+            const vector<int> dims = this->getvector<int>(1, true);
+            const bool keepdims = this->getvar<bool>(2, mem, true);
+            auto &dst = this->returns[0].textvalue;
+            const Precision output_type = mem->gettensor(dst)->shape.dtype;
+            if (input_type != output_type)
+            {
+                error = "Type mismatch: " + precision_str(input_type) + " != " + precision_str(output_type);
+                return 1;
+            }
+
+            // One instantiation per supported element type.
+            switch (input_type)
+            {
+            case Precision::Float64: prod<Author, double>(*mem->gettensor<double>(src), dims, *mem->gettensor<double>(dst), keepdims); break;
+            case Precision::Float32: prod<Author, float>(*mem->gettensor<float>(src), dims, *mem->gettensor<float>(dst), keepdims); break;
+            case Precision::Int64: prod<Author, int64_t>(*mem->gettensor<int64_t>(src), dims, *mem->gettensor<int64_t>(dst), keepdims); break;
+            case Precision::Int32: prod<Author, int32_t>(*mem->gettensor<int32_t>(src), dims, *mem->gettensor<int32_t>(dst), keepdims); break;
+            case Precision::Int16: prod<Author, int16_t>(*mem->gettensor<int16_t>(src), dims, *mem->gettensor<int16_t>(dst), keepdims); break;
+            case Precision::Int8: prod<Author, int8_t>(*mem->gettensor<int8_t>(src), dims, *mem->gettensor<int8_t>(dst), keepdims); break;
+            default:
+                error = "Unsupported type: " + precision_str(input_type);
+                return 1;
+            }
+            return 0;
+        }
+    };
+
+        // TF node for the "reducemax" reduction. run() verifies that input and output
+        // share a dtype, then forwards to reducemax<Author, T> for that element type.
+        template <typename Author>
+    class ReduceMax : public TF
+    {
+    public:
+        // Stores the op name, the author tag and the IR argument/return lists.
+        ReduceMax(const vector<Param> &args, const vector<Param> &returns)
+        {
+            this->name = "reducemax";
+            this->author = Author::name();
+            this->args = args;
+            this->returns = returns;
+        }
+
+        // Example formula for this op.
+        string math_formula() const override { return "B = reducemax(A, axis=[1 2], keepdims=false)"; }
+
+        // Returns a copy of this node, args and returns included.
+        shared_ptr<TF> clone() const override { return make_shared<ReduceMax>(*this); }
+
+        // Runs the reduction against the tensors registered in mem.
+        //   args[0]    name of the input tensor
+        //   arg 1      int vector handed to reducemax() as the axes to reduce
+        //   arg 2      bool handed to reducemax() as keepdims
+        //   returns[0] name of the output tensor
+        // Returns 0 on success; otherwise returns 1 and fills error.
+        int run(shared_ptr<MemBase> mem, string &error) override
+        {
+            auto &src = this->args[0].textvalue;
+            const Precision input_type = mem->gettensor(src)->shape.dtype;
+            const vector<int> dims = this->getvector<int>(1, true);
+            const bool keepdims = this->getvar<bool>(2, mem, true);
+            auto &dst = this->returns[0].textvalue;
+            const Precision output_type = mem->gettensor(dst)->shape.dtype;
+            if (input_type != output_type)
+            {
+                error = "Type mismatch: " + precision_str(input_type) + " != " + precision_str(output_type);
+                return 1;
+            }
+
+            // One instantiation per supported element type.
+            switch (input_type)
+            {
+            case Precision::Float64: reducemax<Author, double>(*mem->gettensor<double>(src), dims, *mem->gettensor<double>(dst), keepdims); break;
+            case Precision::Float32: reducemax<Author, float>(*mem->gettensor<float>(src), dims, *mem->gettensor<float>(dst), keepdims); break;
+            case Precision::Int64: reducemax<Author, int64_t>(*mem->gettensor<int64_t>(src), dims, *mem->gettensor<int64_t>(dst), keepdims); break;
+            case Precision::Int32: reducemax<Author, int32_t>(*mem->gettensor<int32_t>(src), dims, *mem->gettensor<int32_t>(dst), keepdims); break;
+            case Precision::Int16: reducemax<Author, int16_t>(*mem->gettensor<int16_t>(src), dims, *mem->gettensor<int16_t>(dst), keepdims); break;
+            case Precision::Int8: reducemax<Author, int8_t>(*mem->gettensor<int8_t>(src), dims, *mem->gettensor<int8_t>(dst), keepdims); break;
+            default:
+                error = "Unsupported type: " + precision_str(input_type);
+                return 1;
+            }
+            return 0;
+        }
+    };
+
+        // TF node for the "reducemin" reduction. run() verifies that input and output
+        // share a dtype, then forwards to reducemin<Author, T> for that element type.
+        template <typename Author>
+    class ReduceMin : public TF
+    {
+    public:
+        // Stores the op name, the author tag and the IR argument/return lists.
+        ReduceMin(const vector<Param> &args, const vector<Param> &returns)
+        {
+            this->name = "reducemin";
+            this->author = Author::name();
+            this->args = args;
+            this->returns = returns;
+        }
+
+        // Example formula for this op.
+        string math_formula() const override { return "B = reducemin(A, axis=[1 2], keepdims=false)"; }
+
+        // Returns a copy of this node, args and returns included.
+        shared_ptr<TF> clone() const override { return make_shared<ReduceMin>(*this); }
+
+        // Runs the reduction against the tensors registered in mem.
+        //   args[0]    name of the input tensor
+        //   arg 1      int vector handed to reducemin() as the axes to reduce
+        //   arg 2      bool handed to reducemin() as keepdims
+        //   returns[0] name of the output tensor
+        // Returns 0 on success; otherwise returns 1 and fills error.
+        int run(shared_ptr<MemBase> mem, string &error) override
+        {
+            auto &src = this->args[0].textvalue;
+            const Precision input_type = mem->gettensor(src)->shape.dtype;
+            const vector<int> dims = this->getvector<int>(1, true);
+            const bool keepdims = this->getvar<bool>(2, mem, true);
+            auto &dst = this->returns[0].textvalue;
+            const Precision output_type = mem->gettensor(dst)->shape.dtype;
+            if (input_type != output_type)
+            {
+                error = "Type mismatch: " + precision_str(input_type) + " != " + precision_str(output_type);
+                return 1;
+            }
+
+            // One instantiation per supported element type.
+            switch (input_type)
+            {
+            case Precision::Float64: reducemin<Author, double>(*mem->gettensor<double>(src), dims, *mem->gettensor<double>(dst), keepdims); break;
+            case Precision::Float32: reducemin<Author, float>(*mem->gettensor<float>(src), dims, *mem->gettensor<float>(dst), keepdims); break;
+            case Precision::Int64: reducemin<Author, int64_t>(*mem->gettensor<int64_t>(src), dims, *mem->gettensor<int64_t>(dst), keepdims); break;
+            case Precision::Int32: reducemin<Author, int32_t>(*mem->gettensor<int32_t>(src), dims, *mem->gettensor<int32_t>(dst), keepdims); break;
+            case Precision::Int16: reducemin<Author, int16_t>(*mem->gettensor<int16_t>(src), dims, *mem->gettensor<int16_t>(dst), keepdims); break;
+            case Precision::Int8: reducemin<Author, int8_t>(*mem->gettensor<int8_t>(src), dims, *mem->gettensor<int8_t>(dst), keepdims); break;
+            default:
+                error = "Unsupported type: " + precision_str(input_type);
+                return 1;
+            }
+            return 0;
+        }
+    };
+}
+
+#endif // DEEPX_TF_REDUCE_HPP
diff --git a/excuter/op-mem-ompsimd/src/deepx/tf/reduce.hpp.a b/excuter/op-mem-ompsimd/src/deepx/tf/reduce.hpp.a
deleted file mode 100644
index f3e6b039..00000000
--- a/excuter/op-mem-ompsimd/src/deepx/tf/reduce.hpp.a
+++ /dev/null
@@ -1,73 +0,0 @@
-#ifndef DEEPX_OP_REDUCE_HPP
-#define DEEPX_OP_REDUCE_HPP
-
-#include "deepx/tensor.hpp"
-#include "deepx/tensorfunc/reduce.hpp"
-#include "deepx/tensorfunc/changeshape.hpp"
-#include "stdutil/num.hpp"
-
-namespace deepx::op
-{
-    template <typename T>
-    class Sum : public Op
-    {
-    public:
-        Sum()
-        {
-            this->init("sum", deepx::dtype<T>::name(), {}, {}, false, {}, {});
-        }
-        Sum(vector<string> args, vector<string> returns, bool require_grad = false, vector<string> args_grad = {}, vector<string> returns_grad = {})
-        {
-            this->init("sum", deepx::dtype<T>::name(), args, returns, require_grad, args_grad, returns_grad);
-        }
-        Sum(initializer_list<string> args, initializer_list<string> returns, bool require_grad = false, initializer_list<string> args_grad = {}, initializer_list<string> returns_grad = {})
-        {
-            this->init("sum", deepx::dtype<T>::name(), args, returns, require_grad, args_grad, returns_grad);
-        }
-        void forward(mem::Mem &mem) override
-        {
-            auto A = mem.gettensor<T>(this->args[0]);
-            std::vector<int> dims = mem.getvector<int>(this->args[1]);
-            auto output = mem.gettensor<T>(this->returns[0]);
-            tensorfunc::sum(*A, dims, *output);
-        }
-        void backward(mem::Mem &mem) override
-        {
-            auto output_grad = mem.gettensor<T>(this->returns_grad[0]);
-            auto A_grad = mem.gettensor<T>(this->args_grad[0]);
-
-            tensorfunc::expand(*output_grad, *A_grad);
-        }
-        void setexample() override
-        {
-            this->init("sum", "float32", {"T1", "1", "2"}, {"T2"}, false, {}, {});
-        }
-        string math_formula() const override
-        {
-            return "T2 = sum(T1, dims=[1,2])";
-        }
-    };
-
-
-    // todo
-    template <typename T>
-    class Max_reduce : public Op
-    {
-    public:
-        Max_reduce()
-        {
-            this->init("max_reduce", deepx::dtype<T>::name(), {}, {}, false, {}, {});
-        };
-        void forward(mem::Mem &mem) override
-        {
-        }
-
-        void backward(mem::Mem &mem) override {
-
-        };
-    };
-
-   
-}
-
-#endif
diff --git a/excuter/op-mem-ompsimd/test/tensorfunc/5_tensor_sum.cpp b/excuter/op-mem-ompsimd/test/tensorfunc/5_tensor_sum.cpp
index 02fc55ef..c68e2b8e 100644
--- a/excuter/op-mem-ompsimd/test/tensorfunc/5_tensor_sum.cpp
+++ b/excuter/op-mem-ompsimd/test/tensorfunc/5_tensor_sum.cpp
@@ -11,6 +11,7 @@
 #include "deepx/shape_reduce.hpp"
 #include "deepx/tensorfunc/new.hpp"
 #include "deepx/tensorfunc/init_miaobyte.hpp"
+#include "deepx/tensorfunc/new.hpp"
 #include "deepx/tensorfunc/io_miaobyte.hpp"
 #include "deepx/tensorfunc/authors.hpp"
 
@@ -22,19 +23,20 @@ void test_sum()
 {
     omp_set_num_threads(1); 
 
-    Shape shape({2, 3, 4});
-    deepx::Tensor<float> tensor= New<float>(shape.shape);
+    std::vector<int> shape={2, 3, 4};
+    Tensor<float> tensor= New<float>(shape);
     constant<miaobyte,float>(tensor,float(1));
-    print<miaobyte>(tensor);
+    print<miaobyte>(tensor,"%.0f");
     cout<<""<<endl;
     std::vector<std::vector<int>> result = combination(3);
     for (const auto &comb : result)
     {
         std::cout <<"sum(t,"<< comb <<")"<< std::endl;
-        Shape sumshape=reduceShape(shape,comb);
-        Tensor<float> r = New<float>(sumshape.shape);
-        sum<miaobyte,float>(tensor, comb,r);
-        print<miaobyte>(r);
+        std::vector<int> checkeddims=checkedDims(shape,comb);
+        std::vector<int> sumshape=reducedShape(shape,checkeddims);
+        Tensor<float> r = New<float>(sumshape);
+        sum<miaobyte,float>(tensor, checkeddims,r);
+        print<miaobyte>(r,"%.0f");
     }
 /*
 []=>[2, 3, 4]
@@ -49,18 +51,26 @@ void test_sum()
 }
 
 void benchmark_sum(int i){
-    Shape shape({i,i,i});
-    deepx::Tensor<float> tensor= New<float>(shape.shape);
+    std::vector<int> shape={i,i,i};
+    deepx::Tensor<float> tensor= New<float>(shape);
     std::iota(tensor.data ,tensor.data+tensor.shape.size,0);
     std::vector<std::vector<int>> result = combination(3);
-     std::cout<<"sum "<<shape.shape<<"=>";
-     auto start = std::chrono::high_resolution_clock::now();
+    std::cout<<"sum "<<shape<<"=>";
+    auto start = std::chrono::high_resolution_clock::now();
     for (const auto &comb : result)
     {
-        Shape sShape = reduceShape(shape, comb);
-        Tensor<float> r=New<float>(sShape.shape);
-        sum<miaobyte,float>(tensor, comb,r);
-        save<miaobyte>(r,"5_tensor_sum"+std::to_string(i)+"result");
+        std::cout <<"sum(t,"<< comb <<")"<< std::endl;
+        std::vector<int> checkeddims=checkedDims(shape,comb);
+        std::vector<int> sumshape=reducedShape(shape,checkeddims);
+        Tensor<float> r=New<float>(sumshape);
+        sum<miaobyte,float>(tensor, checkeddims,r);
+        string combstr="";
+        for (const auto &c : comb)
+        {
+            combstr+=std::to_string(c)+"_";
+        }
+        save<miaobyte>(r,"5_tensor_sum."+ combstr);
+        print<miaobyte>(r,"%.0f");
     }
     auto end=std::chrono::high_resolution_clock::now();
     std::chrono::duration<double> duration = end - start;
diff --git a/excuter/op-mem-ompsimd/test/tensorfunc/7_tensor_transpose.cpp b/excuter/op-mem-ompsimd/test/tensorfunc/7_tensor_transpose.cpp
index d843b6e1..a97fbcd7 100644
--- a/excuter/op-mem-ompsimd/test/tensorfunc/7_tensor_transpose.cpp
+++ b/excuter/op-mem-ompsimd/test/tensorfunc/7_tensor_transpose.cpp
@@ -9,7 +9,7 @@
 #include "deepx/tensorfunc/io_miaobyte.hpp"
 #include "stdutil/vector.hpp"
 #include "tensorutil.hpp"
-#include "deepx/shape_transpose.hpp"
+#include "deepx/shape_changeshape.hpp"
 
 using namespace deepx::tensorfunc;
 using namespace deepx;
diff --git a/excuter/op-mem-ompsimd/test/tensorfunc/8_tensor_concat.cpp b/excuter/op-mem-ompsimd/test/tensorfunc/8_tensor_concat.cpp
index 9456e408..0922d9bc 100644
--- a/excuter/op-mem-ompsimd/test/tensorfunc/8_tensor_concat.cpp
+++ b/excuter/op-mem-ompsimd/test/tensorfunc/8_tensor_concat.cpp
@@ -6,7 +6,7 @@
 #include "deepx/tensorfunc/changeshape_miaobyte.hpp"
 #include "deepx/tensor.hpp"
 #include "deepx/shape.hpp"
-#include "deepx/shape_concat.hpp"
+#include "deepx/shape_changeshape.hpp"
 #include "deepx/tensorfunc/new.hpp"
 #include "deepx/tensorfunc/init_miaobyte.hpp"
 #include "deepx/tensorfunc/io_miaobyte.hpp"
diff --git a/front/py/deepx/nn/functional/init.py b/front/py/deepx/nn/functional/init.py
index 74581339..77383dda 100644
--- a/front/py/deepx/nn/functional/init.py
+++ b/front/py/deepx/nn/functional/init.py
@@ -50,23 +50,17 @@ def ones(*size, dtype=None, device=None,
 class Arange(Function):
     @staticmethod
     def forward(ctx:Context,
+                t:Tensor,  # existing tensor the "arange" IR is issued for; returned unchanged
                 start:Optional[Union[float,int]]=0,
-                end:Optional[Union[float,int]]=None,
-                step:Optional[Union[float,int]]=1,dtype=None, device=None,name:Union[Tensor,str]='',author='miaobyte')->Tensor:
-        outtensor=None
-        if isinstance(name,str):
-            shape=[end-start]
-            outtensor=Tensor(shape=shape, dtype=dtype, device=device)
-            outtensor.addtograph(name)
-        else:
-            outtensor=name
-        g=outtensor.graph
+                step:Optional[Union[float,int]]=1,
+                author:str='miaobyte')->Tensor:
+        g=t.graph  # the eager flag is read from the graph attached to t
         if g.eager:
-            ir=DeepxIR("arange",  [outtensor.node.name,start,step], [],author)
+            ir=DeepxIR("arange",[t.node.name,start,step], [],author)  # args: tensor node name, start, step; no returns
             send(ir)
-        return outtensor
-def arange(start=0, end=None, step=1,dtype=None, device=None,name:Union[Tensor,str]='',author='miaobyte')->Tensor:
-    return Arange.apply(start,end,step,dtype,device,name,author)
+        return t
+def arange(t:Tensor,start=0,step=1,author:str='miaobyte')->Tensor:  # functional entry point: forwards to Arange.apply
+    return Arange.apply(t,start,step,author)
 
 OpNode.register("uniform")
 class Uniform(Function):
diff --git a/front/py/deepx/nn/functional/reduce.py b/front/py/deepx/nn/functional/reduce.py
index 12dcaefe..10051348 100644
--- a/front/py/deepx/nn/functional/reduce.py
+++ b/front/py/deepx/nn/functional/reduce.py
@@ -1,10 +1,9 @@
 from typing import Optional, Union
 
 from deepx.tensor import Tensor
-from deepx.autograd.graph import OpNode
 from deepx.nn.deepxir import DeepxIR    
 from deepx.scheduler import send
-from .elementwise import _A_b_elementwiseop_C
+from deepx.autograd import OpNode,Function,Context
 
 def reduceshape(inshape: Union[list[int], tuple[int]], 
                dim: Union[list[int], tuple[int]], 
@@ -40,10 +39,11 @@ def reduceshape(inshape: Union[list[int], tuple[int]],
 
 def _A_v_reduceop_C(
         a:Tensor,
-        dim: Union[list[int],tuple[int]] = [],
+        dim: Union[list[int],tuple[int]]=None,
         keepdim:bool=False,
         op:str=None,
-        out:Union[Tensor,str]='')->Tensor:
+        out:Union[Tensor,str]='',
+        author:str='miaobyte')->Tensor:
     
     if dim is None:
         dim=list(range(a.ndim))
@@ -63,36 +63,26 @@ def _A_v_reduceop_C(
     result.node.add_input(opnode)
 
     if a.graph.eager:
-        args = [*dim, "keepdim"] if keepdim else [*dim]
-        varir=DeepxIR("argset",'int32', args, [vector_node.name])
-
-        send(varir)
-        ir=DeepxIR(op, a.dtype, [a.node.name,vector_node.name], [result.node.name])
+        ir=DeepxIR(op, [a.node.name,dim,"true" if keepdim else "false"], [result.node.name],author)
         send(ir)
     return result
-
-#max
-
-OpNode.register("reducemax")
-def reduce_max(
-        a:Tensor,
-        dim:list[int] = None,
-        keepdim=False,
-        out:Union[Tensor,str]='')->Tensor:
-    return _A_v_reduceop_C(a,dim,keepdim,"max",out)
- 
-#min    
-OpNode.register("reducemin")
-def reduce_min(
-        a:Tensor,
-        dim:list[int] = None,
-        keepdim=False,
-        out:Union[Tensor,str]='')->Tensor:
-    return _A_v_reduceop_C(a,dim,keepdim,"min",out)
-    
- 
 #sum    
 OpNode.register("sum")
+class Sum(Function):  # Function wrapper that issues the "sum" reduce op through _A_v_reduceop_C
+    @staticmethod
+    def forward(ctx:Context,a:Tensor,dim:Optional[Union[list[int],tuple[int]]]=None,keepdim:bool=False,out:Union[Tensor,str]='',author:str='miaobyte')->Tensor:
+        if ctx.requires_grad:  # keep the input and the reduce settings on ctx only when gradients are requested
+            ctx.save_tensors('a',a)
+            ctx.save_data('dim',dim)
+            ctx.save_data('keepdim',keepdim)
+        return _A_v_reduceop_C(a,dim,keepdim,"sum",out,author)
+    # backward is a placeholder: it ignores out_grad and returns None.
+    @staticmethod
+    def backward(ctx:Context,out_grad):
+        pass
+    
+    
+
 def sum(
         a:Tensor,
         dim:Optional[Union[
@@ -100,11 +90,22 @@ def sum(
             tuple[int],
             ]]=None,
         keepdim:bool=False,
-        out:Union[Tensor,str]='')->Tensor:
-    return _A_v_reduceop_C(a,dim,keepdim,"sum",out)
+        out:Union[Tensor,str]='',
+        author:str='miaobyte',
+        requires_grad:bool=False)->Tensor:
+    return Sum.apply(a,dim,keepdim,out,author,requires_grad=requires_grad)
 
 #prod
 OpNode.register("prod")
+class Prod(Function):
+    """Function wrapper that runs the "prod" reduction through _A_v_reduceop_C."""
+    @staticmethod
+    def forward(ctx:Context,a:Tensor,dim:Optional[Union[list[int],tuple[int]]]=None,keepdim:bool=False,out:Union[Tensor,str]='',author:str='miaobyte')->Tensor:
+        return _A_v_reduceop_C(a=a,dim=dim,keepdim=keepdim,op="prod",out=out,author=author)
+    @staticmethod
+    def backward(ctx:Context,out_grad):
+        return None  # backward pass is not implemented yet
+
 def prod(
         a:Tensor,
         dim:Optional[Union[
@@ -112,8 +113,50 @@ def prod(
             tuple[int],
             ]]=None,
         keepdim:bool=False,
-        out:Union[Tensor,str]='')->Tensor:
-    return _A_v_reduceop_C(a,dim,keepdim,"prod",out)
+        out:Union[Tensor,str]='',
+        author:str='miaobyte',
+        requires_grad:bool=False)->Tensor:
+    return Prod.apply(a,dim,keepdim,out,author,requires_grad=requires_grad)
+
+#max
+OpNode.register("reducemax")
+class ReduceMax(Function):
+    """Function wrapper that runs the "reducemax" reduction through _A_v_reduceop_C."""
+    @staticmethod
+    def forward(ctx:Context,a:Tensor,dim:Optional[Union[list[int],tuple[int]]]=None,keepdim:bool=False,out:Union[Tensor,str]='',author:str='miaobyte')->Tensor:
+        return _A_v_reduceop_C(a=a,dim=dim,keepdim=keepdim,op="reducemax",out=out,author=author)
+    @staticmethod
+    def backward(ctx:Context,out_grad):
+        return None  # backward pass is not implemented yet
+def reduce_max(a:Tensor,dim:Optional[Union[list[int],tuple[int]]]=None,keepdim:bool=False,
+        out:Union[Tensor,str]='',author:str='miaobyte',requires_grad:bool=False)->Tensor:
+    """Max-reduce ``a`` by delegating to ``ReduceMax.apply``.
+
+    ``dim=None`` is passed through unchanged; the shared helper ``_A_v_reduceop_C``
+    replaces None with every axis of ``a``. ``requires_grad`` goes to ``apply`` by keyword.
+    """
+    return ReduceMax.apply(a,dim,keepdim,out,author,requires_grad=requires_grad)
+ 
+#min    
+OpNode.register("reducemin")
+class ReduceMin(Function):
+    """Function wrapper that runs the "reducemin" reduction through _A_v_reduceop_C."""
+    @staticmethod
+    def forward(ctx:Context,a:Tensor,dim:Optional[Union[list[int],tuple[int]]]=None,keepdim:bool=False,out:Union[Tensor,str]='',author:str='miaobyte')->Tensor:
+        return _A_v_reduceop_C(a=a,dim=dim,keepdim=keepdim,op="reducemin",out=out,author=author)
+    @staticmethod
+    def backward(ctx:Context,out_grad):
+        return None  # backward pass is not implemented yet
+def reduce_min(a:Tensor,dim:Optional[Union[list[int],tuple[int]]]=None,keepdim:bool=False,
+        out:Union[Tensor,str]='',author:str='miaobyte',requires_grad:bool=False)->Tensor:
+    """Min-reduce ``a`` by delegating to ``ReduceMin.apply``.
+
+    ``dim=None`` is passed through unchanged; the shared helper ``_A_v_reduceop_C``
+    replaces None with every axis of ``a``. ``requires_grad`` goes to ``apply`` by keyword.
+    """
+    return ReduceMin.apply(a,dim,keepdim,out,author,requires_grad=requires_grad)
+    
+ 
 
 #mean
 OpNode.register("mean")
@@ -136,5 +179,3 @@ def mean(
         total *= a.shape[i]
     result = sum(a, dim, keepdim, out)/total
     return result
-# #var
-# OpNode.register("var")
\ No newline at end of file
diff --git a/front/py/deepx/tensor/init.py b/front/py/deepx/tensor/init.py
index a6c44f72..f5738829 100644
--- a/front/py/deepx/tensor/init.py
+++ b/front/py/deepx/tensor/init.py
@@ -31,9 +31,9 @@ def randn_(self):
     pass
 
 @tensor_method
-def arange_(self,start,end=None,step=1):
-    #todo
-    pass
+def arange_(self,start=0,step=1,author='miaobyte'):  # tensor method: delegates to the functional arange with this tensor as first argument
+    from deepx.nn.functional import arange as arange_func  # imported at call time, aliased as arange_func
+    arange_func(self,start,step,author)  # any return value is discarded; this method returns None
 
 @tensor_method
 def eye_(self,n,m=None):
diff --git a/front/py/deepx/tensor/tensor.py b/front/py/deepx/tensor/tensor.py
index 7c91ab88..91fa8f7d 100644
--- a/front/py/deepx/tensor/tensor.py
+++ b/front/py/deepx/tensor/tensor.py
@@ -29,6 +29,14 @@ def __init__(
                 self._dtype = default_dtype
         else:
             self._dtype = str(dtype)
+        
+        # format
+        if self._dtype == 'float32' or self._dtype == 'float64' or self._dtype == 'float16' or self._dtype == 'bfloat16':
+            self._format = '%.4f'
+        elif self._dtype == 'int32' or self._dtype == 'int64' or self._dtype == 'int8' or self._dtype == 'int16':
+            self._format = '%d'
+        else:
+            self._format = '%s'
         # shape
         if shape is not None:
             if isinstance(shape, (tuple, list)) and all(isinstance(i, int) for i in shape):
@@ -145,9 +153,12 @@ def __matmul__(self, other):
     def T(self) -> str:
         return self.transpose(1,0,out=self.node.name+".T")
 
+    # Printing: set_format stores the format string that __repr__ hands to printtensor.
+    def set_format(self,format:str):
+        self._format = format
     def __repr__(self) -> str:
         from deepx.nn.functional import printtensor
-        s=printtensor(self)
+        s=printtensor(self,format=self._format)  # uses the format string kept in self._format
         return s
 
 
diff --git a/front/py/examples/2_ir/4_changeshape_broadcast.dot b/front/py/examples/2_ir/4_changeshape_broadcast.dot
index d58501d9..63f24c90 100644
--- a/front/py/examples/2_ir/4_changeshape_broadcast.dot
+++ b/front/py/examples/2_ir/4_changeshape_broadcast.dot
@@ -2,34 +2,34 @@
 digraph {
 	rankdir=TB
 	node [shape=record]
-	139260210680960 [label="a
+	139182860375312 [label="a
 (4, 2, 3)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	139258236846528 [label=reshape color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-	139260210690752 [label="vector_1
+	139181167609744 [label=reshape color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+	139182860384960 [label="vector_1
 (4, 2, 3)" color=darkseagreen fillcolor=honeydew fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	139258235360000 [label="b
+	139181166122448 [label="b
 (2, 1)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	139258235359616 [label=reshape color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-	139258235359856 [label="vector_2
+	139181166122592 [label=reshape color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+	139181166122688 [label="vector_2
 (2, 1)" color=darkseagreen fillcolor=honeydew fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	139258235360048 [label="b.broadcasted
+	139181166122736 [label="b.broadcasted
 (4, 2, 3)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	139258235360096 [label=broadcastTo color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-	139258235360576 [label="vector_3
+	139181166123168 [label=broadcastTo color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+	139181166122928 [label="vector_3
 (4, 2, 3)" color=darkseagreen fillcolor=honeydew fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	139258235360240 [label=add color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-	139258235360480 [label="tensor_4
+	139181166123216 [label=add color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+	139181166123264 [label="tensor_4
 (4, 2, 3)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	139258236846528 -> 139260210680960 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139260210680960 -> 139258236846528 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139260210690752 -> 139258236846528 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139258235359616 -> 139258235360000 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139258235360000 -> 139258235359616 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139258235359856 -> 139258235359616 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139258235360096 -> 139258235360048 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139258235360000 -> 139258235360096 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139258235360576 -> 139258235360096 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139260210680960 -> 139258235360240 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139258235360048 -> 139258235360240 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	139258235360240 -> 139258235360480 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139181167609744 -> 139182860375312 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139182860375312 -> 139181167609744 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139182860384960 -> 139181167609744 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139181166122592 -> 139181166122448 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139181166122448 -> 139181166122592 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139181166122688 -> 139181166122592 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139181166123168 -> 139181166122736 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139181166122448 -> 139181166123168 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139181166122928 -> 139181166123168 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139182860375312 -> 139181166123216 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139181166122736 -> 139181166123216 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	139181166123216 -> 139181166123264 [arrowsize=0.8 color=gray40 penwidth=1.2]
 }
diff --git a/front/py/examples/2_ir/4_changeshape_broadcast.dot.svg b/front/py/examples/2_ir/4_changeshape_broadcast.dot.svg
index 293e8a9a..5ee163ac 100644
--- a/front/py/examples/2_ir/4_changeshape_broadcast.dot.svg
+++ b/front/py/examples/2_ir/4_changeshape_broadcast.dot.svg
@@ -9,148 +9,148 @@
 <g id="graph0" class="graph" transform="scale(1 1) rotate(0) translate(4 334)">
 <title>%3</title>
 <polygon fill="white" stroke="transparent" points="-4,4 -4,-334 285.5,-334 285.5,4 -4,4"/>
-<!-- 139260210680960 -->
+<!-- 139182860375312 -->
 <g id="node1" class="node">
-<title>139260210680960</title>
+<title>139182860375312</title>
 <polygon fill="aliceblue" stroke="skyblue" points="152,-184 90,-184 90,-146 152,-146 152,-184"/>
 <text text-anchor="middle" x="121" y="-168.8" font-family="Sans-Serif" font-size="14.00">a</text>
 <text text-anchor="middle" x="121" y="-153.8" font-family="Sans-Serif" font-size="14.00">(4, 2, 3)</text>
 </g>
-<!-- 139258236846528 -->
+<!-- 139181167609744 -->
 <g id="node2" class="node">
-<title>139258236846528</title>
+<title>139181167609744</title>
 <polygon fill="lightgray" stroke="darkslategray" points="158,-110 84,-110 84,-74 158,-74 158,-110"/>
 <text text-anchor="middle" x="121" y="-88.3" font-family="Courier Bold" font-size="14.00">reshape</text>
 </g>
-<!-- 139260210680960&#45;&gt;139258236846528 -->
+<!-- 139182860375312&#45;&gt;139181167609744 -->
 <g id="edge2" class="edge">
-<title>139260210680960&#45;&gt;139258236846528</title>
+<title>139182860375312&#45;&gt;139181167609744</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M115.01,-145.72C114.2,-137.29 114.04,-127.15 114.52,-118.02"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="117.31,-118.2 115.14,-110 111.73,-117.76 117.31,-118.2"/>
 </g>
-<!-- 139258235360240 -->
+<!-- 139181166123216 -->
 <g id="node10" class="node">
-<title>139258235360240</title>
+<title>139181166123216</title>
 <polygon fill="lightgray" stroke="darkslategray" points="241,-110 187,-110 187,-74 241,-74 241,-110"/>
 <text text-anchor="middle" x="214" y="-88.3" font-family="Courier Bold" font-size="14.00">add</text>
 </g>
-<!-- 139260210680960&#45;&gt;139258235360240 -->
+<!-- 139182860375312&#45;&gt;139181166123216 -->
 <g id="edge10" class="edge">
-<title>139260210680960&#45;&gt;139258235360240</title>
+<title>139182860375312&#45;&gt;139181166123216</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M144.95,-145.72C157.23,-136.34 172.28,-124.85 185.2,-114.99"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="187.07,-117.08 191.73,-110 183.67,-112.63 187.07,-117.08"/>
 </g>
-<!-- 139258236846528&#45;&gt;139260210680960 -->
+<!-- 139181167609744&#45;&gt;139182860375312 -->
 <g id="edge1" class="edge">
-<title>139258236846528&#45;&gt;139260210680960</title>
+<title>139181167609744&#45;&gt;139182860375312</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M126.86,-110C127.73,-118.25 127.96,-128.35 127.55,-137.57"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="124.75,-137.54 126.99,-145.72 130.33,-137.93 124.75,-137.54"/>
 </g>
-<!-- 139260210690752 -->
+<!-- 139182860384960 -->
 <g id="node3" class="node">
-<title>139260210690752</title>
+<title>139182860384960</title>
 <polygon fill="honeydew" stroke="darkseagreen" points="72,-184 0,-184 0,-146 72,-146 72,-184"/>
 <text text-anchor="middle" x="36" y="-168.8" font-family="Sans-Serif" font-size="14.00">vector_1</text>
 <text text-anchor="middle" x="36" y="-153.8" font-family="Sans-Serif" font-size="14.00">(4, 2, 3)</text>
 </g>
-<!-- 139260210690752&#45;&gt;139258236846528 -->
+<!-- 139182860384960&#45;&gt;139181167609744 -->
 <g id="edge3" class="edge">
-<title>139260210690752&#45;&gt;139258236846528</title>
+<title>139182860384960&#45;&gt;139181167609744</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M57.89,-145.72C69.01,-136.42 82.62,-125.06 94.35,-115.26"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="96.3,-117.28 100.64,-110 92.71,-112.98 96.3,-117.28"/>
 </g>
-<!-- 139258235360000 -->
+<!-- 139181166122448 -->
 <g id="node4" class="node">
-<title>139258235360000</title>
+<title>139181166122448</title>
 <polygon fill="aliceblue" stroke="skyblue" points="158,-330 104,-330 104,-292 158,-292 158,-330"/>
 <text text-anchor="middle" x="131" y="-314.8" font-family="Sans-Serif" font-size="14.00">b</text>
 <text text-anchor="middle" x="131" y="-299.8" font-family="Sans-Serif" font-size="14.00">(2, 1)</text>
 </g>
-<!-- 139258235359616 -->
+<!-- 139181166122592 -->
 <g id="node5" class="node">
-<title>139258235359616</title>
+<title>139181166122592</title>
 <polygon fill="lightgray" stroke="darkslategray" points="154,-256 80,-256 80,-220 154,-220 154,-256"/>
 <text text-anchor="middle" x="117" y="-234.3" font-family="Courier Bold" font-size="14.00">reshape</text>
 </g>
-<!-- 139258235360000&#45;&gt;139258235359616 -->
+<!-- 139181166122448&#45;&gt;139181166122592 -->
 <g id="edge5" class="edge">
-<title>139258235360000&#45;&gt;139258235359616</title>
+<title>139181166122448&#45;&gt;139181166122592</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M121.41,-291.72C118.93,-283.29 116.77,-273.15 115.45,-264.02"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="118.22,-263.61 114.49,-256 112.66,-264.28 118.22,-263.61"/>
 </g>
-<!-- 139258235360096 -->
+<!-- 139181166123168 -->
 <g id="node8" class="node">
-<title>139258235360096</title>
+<title>139181166123168</title>
 <polygon fill="lightgray" stroke="darkslategray" points="279.5,-256 172.5,-256 172.5,-220 279.5,-220 279.5,-256"/>
 <text text-anchor="middle" x="226" y="-234.3" font-family="Courier Bold" font-size="14.00">broadcastTo</text>
 </g>
-<!-- 139258235360000&#45;&gt;139258235360096 -->
+<!-- 139181166122448&#45;&gt;139181166123168 -->
 <g id="edge8" class="edge">
-<title>139258235360000&#45;&gt;139258235360096</title>
+<title>139181166122448&#45;&gt;139181166123168</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M155.46,-291.72C168.01,-282.34 183.39,-270.85 196.58,-260.99"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="198.52,-263.04 203.25,-256 195.16,-258.55 198.52,-263.04"/>
 </g>
-<!-- 139258235359616&#45;&gt;139258235360000 -->
+<!-- 139181166122592&#45;&gt;139181166122448 -->
 <g id="edge4" class="edge">
-<title>139258235359616&#45;&gt;139258235360000</title>
+<title>139181166122592&#45;&gt;139181166122448</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M126.21,-256C128.71,-264.25 130.93,-274.35 132.34,-283.57"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="129.59,-284.14 133.38,-291.72 135.14,-283.42 129.59,-284.14"/>
 </g>
-<!-- 139258235359856 -->
+<!-- 139181166122688 -->
 <g id="node6" class="node">
-<title>139258235359856</title>
+<title>139181166122688</title>
 <polygon fill="honeydew" stroke="darkseagreen" points="86,-330 14,-330 14,-292 86,-292 86,-330"/>
 <text text-anchor="middle" x="50" y="-314.8" font-family="Sans-Serif" font-size="14.00">vector_2</text>
 <text text-anchor="middle" x="50" y="-299.8" font-family="Sans-Serif" font-size="14.00">(2, 1)</text>
 </g>
-<!-- 139258235359856&#45;&gt;139258235359616 -->
+<!-- 139181166122688&#45;&gt;139181166122592 -->
 <g id="edge6" class="edge">
-<title>139258235359856&#45;&gt;139258235359616</title>
+<title>139181166122688&#45;&gt;139181166122592</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M67.25,-291.72C75.78,-282.68 86.15,-271.69 95.22,-262.08"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="97.5,-263.74 100.95,-256 93.43,-259.9 97.5,-263.74"/>
 </g>
-<!-- 139258235360048 -->
+<!-- 139181166122736 -->
 <g id="node7" class="node">
-<title>139258235360048</title>
+<title>139181166122736</title>
 <polygon fill="aliceblue" stroke="skyblue" points="281.5,-184 170.5,-184 170.5,-146 281.5,-146 281.5,-184"/>
 <text text-anchor="middle" x="226" y="-168.8" font-family="Sans-Serif" font-size="14.00">b.broadcasted</text>
 <text text-anchor="middle" x="226" y="-153.8" font-family="Sans-Serif" font-size="14.00">(4, 2, 3)</text>
 </g>
-<!-- 139258235360048&#45;&gt;139258235360240 -->
+<!-- 139181166122736&#45;&gt;139181166123216 -->
 <g id="edge11" class="edge">
-<title>139258235360048&#45;&gt;139258235360240</title>
+<title>139181166122736&#45;&gt;139181166123216</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M222.91,-145.72C221.48,-137.29 219.77,-127.15 218.23,-118.02"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="220.97,-117.42 216.87,-110 215.45,-118.36 220.97,-117.42"/>
 </g>
-<!-- 139258235360096&#45;&gt;139258235360048 -->
+<!-- 139181166123168&#45;&gt;139181166122736 -->
 <g id="edge7" class="edge">
-<title>139258235360096&#45;&gt;139258235360048</title>
+<title>139181166123168&#45;&gt;139181166122736</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M226,-219.81C226,-211.52 226,-201.39 226,-192.16"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="228.8,-192.02 226,-184.02 223.2,-192.02 228.8,-192.02"/>
 </g>
-<!-- 139258235360576 -->
+<!-- 139181166122928 -->
 <g id="node9" class="node">
-<title>139258235360576</title>
+<title>139181166122928</title>
 <polygon fill="honeydew" stroke="darkseagreen" points="262,-330 190,-330 190,-292 262,-292 262,-330"/>
 <text text-anchor="middle" x="226" y="-314.8" font-family="Sans-Serif" font-size="14.00">vector_3</text>
 <text text-anchor="middle" x="226" y="-299.8" font-family="Sans-Serif" font-size="14.00">(4, 2, 3)</text>
 </g>
-<!-- 139258235360576&#45;&gt;139258235360096 -->
+<!-- 139181166122928&#45;&gt;139181166123168 -->
 <g id="edge9" class="edge">
-<title>139258235360576&#45;&gt;139258235360096</title>
+<title>139181166122928&#45;&gt;139181166123168</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M226,-291.72C226,-283.29 226,-273.15 226,-264.02"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="228.8,-264 226,-256 223.2,-264 228.8,-264"/>
 </g>
-<!-- 139258235360480 -->
+<!-- 139181166123264 -->
 <g id="node11" class="node">
-<title>139258235360480</title>
+<title>139181166123264</title>
 <polygon fill="aliceblue" stroke="skyblue" points="250.5,-38 177.5,-38 177.5,0 250.5,0 250.5,-38"/>
 <text text-anchor="middle" x="214" y="-22.8" font-family="Sans-Serif" font-size="14.00">tensor_4</text>
 <text text-anchor="middle" x="214" y="-7.8" font-family="Sans-Serif" font-size="14.00">(4, 2, 3)</text>
 </g>
-<!-- 139258235360240&#45;&gt;139258235360480 -->
+<!-- 139181166123216&#45;&gt;139181166123264 -->
 <g id="edge12" class="edge">
-<title>139258235360240&#45;&gt;139258235360480</title>
+<title>139181166123216&#45;&gt;139181166123264</title>
 <path fill="none" stroke="#666666" stroke-width="1.2" d="M214,-73.81C214,-65.52 214,-55.39 214,-46.16"/>
 <polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="216.8,-46.02 214,-38.02 211.2,-46.02 216.8,-46.02"/>
 </g>
diff --git a/front/py/examples/2_ir/5_reduce_sum.dot b/front/py/examples/2_ir/5_reduce_sum.dot
deleted file mode 100644
index 9670e4f4..00000000
--- a/front/py/examples/2_ir/5_reduce_sum.dot
+++ /dev/null
@@ -1,41 +0,0 @@
-// Computational Graph
-digraph {
-	rankdir=TB
-	node [shape=record]
-	137431348365008 [label="t
-(3, 4, 5)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	137429052759232 [label=uniform color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-	137431348378688 [label="var_1
--1" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	137429052765232 [label="var_2
-1" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	137429050978992 [label="var_3
-0" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	137429050978752 [label="s
-(4,)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	137429050978800 [label="vector_1
-[0, 2]" color=darkseagreen fillcolor=honeydew fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	137429050979232 [label=sum color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-	137429050979184 [label="t1
-(4, 5, 6)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	137429050979568 [label=constant color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-	137429050979520 [label="var_4
-1" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	137429050979664 [label="t2
-(6,)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	137429050979952 [label="vector_2
-[0, 1]" color=darkseagreen fillcolor=honeydew fontname="Sans-Serif" labeljust=l shape=box style=filled]
-	137429050980048 [label=sum color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
-	137429052759232 -> 137431348365008 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137431348378688 -> 137429052759232 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137429052765232 -> 137429052759232 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137429050978992 -> 137429052759232 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137429050979232 -> 137429050978752 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137431348365008 -> 137429050979232 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137429050978800 -> 137429050979232 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137429050979568 -> 137429050979184 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137429050979520 -> 137429050979568 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137429050980048 -> 137429050979664 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137429050979184 -> 137429050980048 [arrowsize=0.8 color=gray40 penwidth=1.2]
-	137429050979952 -> 137429050980048 [arrowsize=0.8 color=gray40 penwidth=1.2]
-}
diff --git a/front/py/examples/2_ir/5_reduce_sum.dot.svg b/front/py/examples/2_ir/5_reduce_sum.dot.svg
deleted file mode 100644
index cc43c7f4..00000000
--- a/front/py/examples/2_ir/5_reduce_sum.dot.svg
+++ /dev/null
@@ -1,179 +0,0 @@
-<?xml version="1.0" encoding="UTF-8" standalone="no"?>
-<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN"
- "http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
-<!-- Generated by graphviz version 2.43.0 (0)
- -->
-<!-- Title: %3 Pages: 1 -->
-<svg width="341pt" height="338pt"
- viewBox="0.00 0.00 340.50 338.00" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink">
-<g id="graph0" class="graph" transform="scale(1 1) rotate(0) translate(4 334)">
-<title>%3</title>
-<polygon fill="white" stroke="transparent" points="-4,4 -4,-334 336.5,-334 336.5,4 -4,4"/>
-<!-- 137431348365008 -->
-<g id="node1" class="node">
-<title>137431348365008</title>
-<polygon fill="aliceblue" stroke="skyblue" points="152,-184 90,-184 90,-146 152,-146 152,-184"/>
-<text text-anchor="middle" x="121" y="-168.8" font-family="Sans-Serif" font-size="14.00">t</text>
-<text text-anchor="middle" x="121" y="-153.8" font-family="Sans-Serif" font-size="14.00">(3, 4, 5)</text>
-</g>
-<!-- 137429050979232 -->
-<g id="node8" class="node">
-<title>137429050979232</title>
-<polygon fill="lightgray" stroke="darkslategray" points="106,-110 52,-110 52,-74 106,-74 106,-110"/>
-<text text-anchor="middle" x="79" y="-88.3" font-family="Courier Bold" font-size="14.00">sum</text>
-</g>
-<!-- 137431348365008&#45;&gt;137429050979232 -->
-<g id="edge6" class="edge">
-<title>137431348365008&#45;&gt;137429050979232</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M110.18,-145.72C104.99,-136.94 98.71,-126.31 93.14,-116.91"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="95.54,-115.46 89.06,-110 90.72,-118.31 95.54,-115.46"/>
-</g>
-<!-- 137429052759232 -->
-<g id="node2" class="node">
-<title>137429052759232</title>
-<polygon fill="lightgray" stroke="darkslategray" points="158,-256 84,-256 84,-220 158,-220 158,-256"/>
-<text text-anchor="middle" x="121" y="-234.3" font-family="Courier Bold" font-size="14.00">uniform</text>
-</g>
-<!-- 137429052759232&#45;&gt;137431348365008 -->
-<g id="edge1" class="edge">
-<title>137429052759232&#45;&gt;137431348365008</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M121,-219.81C121,-211.52 121,-201.39 121,-192.16"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="123.8,-192.02 121,-184.02 118.2,-192.02 123.8,-192.02"/>
-</g>
-<!-- 137431348378688 -->
-<g id="node3" class="node">
-<title>137431348378688</title>
-<polygon fill="moccasin" stroke="orange" points="76,-330 22,-330 22,-292 76,-292 76,-330"/>
-<text text-anchor="middle" x="49" y="-314.8" font-family="Sans-Serif" font-size="14.00">var_1</text>
-<text text-anchor="middle" x="49" y="-299.8" font-family="Sans-Serif" font-size="14.00">&#45;1</text>
-</g>
-<!-- 137431348378688&#45;&gt;137429052759232 -->
-<g id="edge2" class="edge">
-<title>137431348378688&#45;&gt;137429052759232</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M67.54,-291.72C76.79,-282.6 88.06,-271.48 97.87,-261.81"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="100.03,-263.61 103.76,-256 96.09,-259.63 100.03,-263.61"/>
-</g>
-<!-- 137429052765232 -->
-<g id="node4" class="node">
-<title>137429052765232</title>
-<polygon fill="moccasin" stroke="orange" points="148,-330 94,-330 94,-292 148,-292 148,-330"/>
-<text text-anchor="middle" x="121" y="-314.8" font-family="Sans-Serif" font-size="14.00">var_2</text>
-<text text-anchor="middle" x="121" y="-299.8" font-family="Sans-Serif" font-size="14.00">1</text>
-</g>
-<!-- 137429052765232&#45;&gt;137429052759232 -->
-<g id="edge3" class="edge">
-<title>137429052765232&#45;&gt;137429052759232</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M121,-291.72C121,-283.29 121,-273.15 121,-264.02"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="123.8,-264 121,-256 118.2,-264 123.8,-264"/>
-</g>
-<!-- 137429050978992 -->
-<g id="node5" class="node">
-<title>137429050978992</title>
-<polygon fill="moccasin" stroke="orange" points="220,-330 166,-330 166,-292 220,-292 220,-330"/>
-<text text-anchor="middle" x="193" y="-314.8" font-family="Sans-Serif" font-size="14.00">var_3</text>
-<text text-anchor="middle" x="193" y="-299.8" font-family="Sans-Serif" font-size="14.00">0</text>
-</g>
-<!-- 137429050978992&#45;&gt;137429052759232 -->
-<g id="edge4" class="edge">
-<title>137429050978992&#45;&gt;137429052759232</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M174.46,-291.72C165.21,-282.6 153.94,-271.48 144.13,-261.81"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="145.91,-259.63 138.24,-256 141.97,-263.61 145.91,-259.63"/>
-</g>
-<!-- 137429050978752 -->
-<g id="node6" class="node">
-<title>137429050978752</title>
-<polygon fill="aliceblue" stroke="skyblue" points="106,-38 52,-38 52,0 106,0 106,-38"/>
-<text text-anchor="middle" x="79" y="-22.8" font-family="Sans-Serif" font-size="14.00">s</text>
-<text text-anchor="middle" x="79" y="-7.8" font-family="Sans-Serif" font-size="14.00">(4,)</text>
-</g>
-<!-- 137429050978800 -->
-<g id="node7" class="node">
-<title>137429050978800</title>
-<polygon fill="honeydew" stroke="darkseagreen" points="72,-184 0,-184 0,-146 72,-146 72,-184"/>
-<text text-anchor="middle" x="36" y="-168.8" font-family="Sans-Serif" font-size="14.00">vector_1</text>
-<text text-anchor="middle" x="36" y="-153.8" font-family="Sans-Serif" font-size="14.00">[0, 2]</text>
-</g>
-<!-- 137429050978800&#45;&gt;137429050979232 -->
-<g id="edge7" class="edge">
-<title>137429050978800&#45;&gt;137429050979232</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M47.07,-145.72C52.39,-136.94 58.82,-126.31 64.52,-116.91"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="66.95,-118.3 68.7,-110 62.16,-115.4 66.95,-118.3"/>
-</g>
-<!-- 137429050979232&#45;&gt;137429050978752 -->
-<g id="edge5" class="edge">
-<title>137429050979232&#45;&gt;137429050978752</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M79,-73.81C79,-65.52 79,-55.39 79,-46.16"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="81.8,-46.02 79,-38.02 76.2,-46.02 81.8,-46.02"/>
-</g>
-<!-- 137429050979184 -->
-<g id="node9" class="node">
-<title>137429050979184</title>
-<polygon fill="aliceblue" stroke="skyblue" points="322,-184 260,-184 260,-146 322,-146 322,-184"/>
-<text text-anchor="middle" x="291" y="-168.8" font-family="Sans-Serif" font-size="14.00">t1</text>
-<text text-anchor="middle" x="291" y="-153.8" font-family="Sans-Serif" font-size="14.00">(4, 5, 6)</text>
-</g>
-<!-- 137429050980048 -->
-<g id="node14" class="node">
-<title>137429050980048</title>
-<polygon fill="lightgray" stroke="darkslategray" points="275,-110 221,-110 221,-74 275,-74 275,-110"/>
-<text text-anchor="middle" x="248" y="-88.3" font-family="Courier Bold" font-size="14.00">sum</text>
-</g>
-<!-- 137429050979184&#45;&gt;137429050980048 -->
-<g id="edge11" class="edge">
-<title>137429050979184&#45;&gt;137429050980048</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M279.93,-145.72C274.61,-136.94 268.18,-126.31 262.48,-116.91"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="264.84,-115.4 258.3,-110 260.05,-118.3 264.84,-115.4"/>
-</g>
-<!-- 137429050979568 -->
-<g id="node10" class="node">
-<title>137429050979568</title>
-<polygon fill="lightgray" stroke="darkslategray" points="332.5,-256 249.5,-256 249.5,-220 332.5,-220 332.5,-256"/>
-<text text-anchor="middle" x="291" y="-234.3" font-family="Courier Bold" font-size="14.00">constant</text>
-</g>
-<!-- 137429050979568&#45;&gt;137429050979184 -->
-<g id="edge8" class="edge">
-<title>137429050979568&#45;&gt;137429050979184</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M291,-219.81C291,-211.52 291,-201.39 291,-192.16"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="293.8,-192.02 291,-184.02 288.2,-192.02 293.8,-192.02"/>
-</g>
-<!-- 137429050979520 -->
-<g id="node11" class="node">
-<title>137429050979520</title>
-<polygon fill="moccasin" stroke="orange" points="318,-330 264,-330 264,-292 318,-292 318,-330"/>
-<text text-anchor="middle" x="291" y="-314.8" font-family="Sans-Serif" font-size="14.00">var_4</text>
-<text text-anchor="middle" x="291" y="-299.8" font-family="Sans-Serif" font-size="14.00">1</text>
-</g>
-<!-- 137429050979520&#45;&gt;137429050979568 -->
-<g id="edge9" class="edge">
-<title>137429050979520&#45;&gt;137429050979568</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M291,-291.72C291,-283.29 291,-273.15 291,-264.02"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="293.8,-264 291,-256 288.2,-264 293.8,-264"/>
-</g>
-<!-- 137429050979664 -->
-<g id="node12" class="node">
-<title>137429050979664</title>
-<polygon fill="aliceblue" stroke="skyblue" points="275,-38 221,-38 221,0 275,0 275,-38"/>
-<text text-anchor="middle" x="248" y="-22.8" font-family="Sans-Serif" font-size="14.00">t2</text>
-<text text-anchor="middle" x="248" y="-7.8" font-family="Sans-Serif" font-size="14.00">(6,)</text>
-</g>
-<!-- 137429050979952 -->
-<g id="node13" class="node">
-<title>137429050979952</title>
-<polygon fill="honeydew" stroke="darkseagreen" points="242,-184 170,-184 170,-146 242,-146 242,-184"/>
-<text text-anchor="middle" x="206" y="-168.8" font-family="Sans-Serif" font-size="14.00">vector_2</text>
-<text text-anchor="middle" x="206" y="-153.8" font-family="Sans-Serif" font-size="14.00">[0, 1]</text>
-</g>
-<!-- 137429050979952&#45;&gt;137429050980048 -->
-<g id="edge12" class="edge">
-<title>137429050979952&#45;&gt;137429050980048</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M216.82,-145.72C222.01,-136.94 228.29,-126.31 233.86,-116.91"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="236.28,-118.31 237.94,-110 231.46,-115.46 236.28,-118.31"/>
-</g>
-<!-- 137429050980048&#45;&gt;137429050979664 -->
-<g id="edge10" class="edge">
-<title>137429050980048&#45;&gt;137429050979664</title>
-<path fill="none" stroke="#666666" stroke-width="1.2" d="M248,-73.81C248,-65.52 248,-55.39 248,-46.16"/>
-<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="250.8,-46.02 248,-38.02 245.2,-46.02 250.8,-46.02"/>
-</g>
-</g>
-</svg>
diff --git a/front/py/examples/2_ir/5_reduce_sum_keepdim.py b/front/py/examples/2_ir/5_reduce_sum_keepdim.py
index 41bc77c9..e6f1c5e4 100644
--- a/front/py/examples/2_ir/5_reduce_sum_keepdim.py
+++ b/front/py/examples/2_ir/5_reduce_sum_keepdim.py
@@ -1,28 +1,46 @@
 ############-------PyTorch-------################
 
 import torch
-torch_t = torch.arange(60).reshape(3,4,5)
+torch_t = torch.arange(0,60).reshape(3,4,5)
 print(torch_t)
+torch_s = torch.sum(torch_t, dim=[0, 2],keepdim=True)
+print(torch_s)
+# keepdim=True so the reference keeps the reduced axis, like the DEEPX prod call below
+torch_p=torch.prod(torch_t,dim=1,keepdim=True)
+print(torch_p)
 
-torch_s1 = torch.sum(torch_t, dim=[0, 2],keepdim=True)
-print(torch_s1)
-
+torch_t1 = torch.ones(4, 5, 6,dtype=torch.float)
+print(torch_t1)
+torch_t2 = torch.sum(torch_t1, dim=[0, 1],keepdim=True)
+print(torch_t2)
 
 
 ############-------DEEPX-------################
 
 from deepx import Tensor,ones,zeros,arange
-from deepx.nn.functional import sum,mean
-
-t=arange(0,60,1).reshape_(3,4,5)
-print((t))
-
-s1=sum(t,dim=[0,2],keepdim=True,out="s1")
-print(s1)
-
+from deepx.nn.functional import sum,prod
+
+t=Tensor(shape=(3,4,5))
+t.addtograph("t")
+t.arange_(0,1)
+t.set_format("%.0f")
+print(t)
+s=sum(t,dim=[0,2],out="s",keepdim=True)
+s.set_format("%.0f")
+print(s)
+p=prod(t,dim=[1],out="p",keepdim=True)
+p.set_format("%.0f")
+# print(p)
+
+t1=ones(4,5,6,name="t1")
+t1.set_format("%.0f")
+print(t1)
+t2=sum(t1,dim=[0,1],out='t2',keepdim=True)
+t2.set_format("%.0f")
+print(t2)
 
 
 import os
 script_name = os.path.splitext(os.path.basename( os.path.abspath(__file__)))[0]
-str=t.graph.to_dot()
+str=t2.graph.to_dot()
 str.render(script_name+".dot", format='svg')
\ No newline at end of file
diff --git a/front/py/examples/2_ir/5_reduce_sumprod.dot b/front/py/examples/2_ir/5_reduce_sumprod.dot
new file mode 100644
index 00000000..da812dbb
--- /dev/null
+++ b/front/py/examples/2_ir/5_reduce_sumprod.dot
@@ -0,0 +1,38 @@
+// Computational Graph
+digraph {
+	rankdir=TB
+	node [shape=record]
+	133977343199552 [label="t
+(3, 4, 5)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
+	133975085212112 [label="s
+(4,)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
+	133975083685904 [label="vector_1
+[0, 2]" color=darkseagreen fillcolor=honeydew fontname="Sans-Serif" labeljust=l shape=box style=filled]
+	133975083685520 [label=sum color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+	133975083685760 [label="p
+(3, 5)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
+	133975083686048 [label="vector_2
+[1]" color=darkseagreen fillcolor=honeydew fontname="Sans-Serif" labeljust=l shape=box style=filled]
+	133975083686096 [label=prod color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+	133977343199120 [label="t1
+(4, 5, 6)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
+	133975083686528 [label=constant color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+	133975083686288 [label="var_1
+1" color=orange fillcolor=moccasin fontname="Sans-Serif" labeljust=l shape=box style=filled]
+	133975083686240 [label="t2
+(6,)" color=skyblue fillcolor=aliceblue fontname="Sans-Serif" labeljust=l shape=box style=filled]
+	133975083686768 [label="vector_3
+[0, 1]" color=darkseagreen fillcolor=honeydew fontname="Sans-Serif" labeljust=l shape=box style=filled]
+	133975083686576 [label=sum color=darkslategray fillcolor=lightgray fontname="Courier Bold" labeljust=l shape=box style=filled]
+	133975083685520 -> 133975085212112 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	133977343199552 -> 133975083685520 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	133975083685904 -> 133975083685520 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	133975083686096 -> 133975083685760 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	133977343199552 -> 133975083686096 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	133975083686048 -> 133975083686096 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	133975083686528 -> 133977343199120 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	133975083686288 -> 133975083686528 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	133975083686576 -> 133975083686240 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	133977343199120 -> 133975083686576 [arrowsize=0.8 color=gray40 penwidth=1.2]
+	133975083686768 -> 133975083686576 [arrowsize=0.8 color=gray40 penwidth=1.2]
+}
diff --git a/front/py/examples/2_ir/5_reduce_sumprod.dot.svg b/front/py/examples/2_ir/5_reduce_sumprod.dot.svg
new file mode 100644
index 00000000..2b180653
--- /dev/null
+++ b/front/py/examples/2_ir/5_reduce_sumprod.dot.svg
@@ -0,0 +1,166 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN"
+ "http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
+<!-- Generated by graphviz version 2.43.0 (0)
+ -->
+<!-- Title: %3 Pages: 1 -->
+<svg width="376pt" height="338pt"
+ viewBox="0.00 0.00 375.50 338.00" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink">
+<g id="graph0" class="graph" transform="scale(1 1) rotate(0) translate(4 334)">
+<title>%3</title>
+<polygon fill="white" stroke="transparent" points="-4,4 -4,-334 371.5,-334 371.5,4 -4,4"/>
+<!-- 133977343199552 -->
+<g id="node1" class="node">
+<title>133977343199552</title>
+<polygon fill="aliceblue" stroke="skyblue" points="152,-330 90,-330 90,-292 152,-292 152,-330"/>
+<text text-anchor="middle" x="121" y="-314.8" font-family="Sans-Serif" font-size="14.00">t</text>
+<text text-anchor="middle" x="121" y="-299.8" font-family="Sans-Serif" font-size="14.00">(3, 4, 5)</text>
+</g>
+<!-- 133975083685520 -->
+<g id="node4" class="node">
+<title>133975083685520</title>
+<polygon fill="lightgray" stroke="darkslategray" points="109,-256 55,-256 55,-220 109,-220 109,-256"/>
+<text text-anchor="middle" x="82" y="-234.3" font-family="Courier Bold" font-size="14.00">sum</text>
+</g>
+<!-- 133977343199552&#45;&gt;133975083685520 -->
+<g id="edge2" class="edge">
+<title>133977343199552&#45;&gt;133975083685520</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M110.96,-291.72C106.18,-283.03 100.41,-272.52 95.28,-263.19"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="97.65,-261.67 91.34,-256 92.74,-264.36 97.65,-261.67"/>
+</g>
+<!-- 133975083686096 -->
+<g id="node7" class="node">
+<title>133975083686096</title>
+<polygon fill="lightgray" stroke="darkslategray" points="187,-256 133,-256 133,-220 187,-220 187,-256"/>
+<text text-anchor="middle" x="160" y="-234.3" font-family="Courier Bold" font-size="14.00">prod</text>
+</g>
+<!-- 133977343199552&#45;&gt;133975083686096 -->
+<g id="edge5" class="edge">
+<title>133977343199552&#45;&gt;133975083686096</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M131.04,-291.72C135.82,-283.03 141.59,-272.52 146.72,-263.19"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="149.26,-264.36 150.66,-256 144.35,-261.67 149.26,-264.36"/>
+</g>
+<!-- 133975085212112 -->
+<g id="node2" class="node">
+<title>133975085212112</title>
+<polygon fill="aliceblue" stroke="skyblue" points="109,-184 55,-184 55,-146 109,-146 109,-184"/>
+<text text-anchor="middle" x="82" y="-168.8" font-family="Sans-Serif" font-size="14.00">s</text>
+<text text-anchor="middle" x="82" y="-153.8" font-family="Sans-Serif" font-size="14.00">(4,)</text>
+</g>
+<!-- 133975083685904 -->
+<g id="node3" class="node">
+<title>133975083685904</title>
+<polygon fill="honeydew" stroke="darkseagreen" points="72,-330 0,-330 0,-292 72,-292 72,-330"/>
+<text text-anchor="middle" x="36" y="-314.8" font-family="Sans-Serif" font-size="14.00">vector_1</text>
+<text text-anchor="middle" x="36" y="-299.8" font-family="Sans-Serif" font-size="14.00">[0, 2]</text>
+</g>
+<!-- 133975083685904&#45;&gt;133975083685520 -->
+<g id="edge3" class="edge">
+<title>133975083685904&#45;&gt;133975083685520</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M47.85,-291.72C53.53,-282.94 60.42,-272.31 66.51,-262.91"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="68.98,-264.24 70.98,-256 64.28,-261.19 68.98,-264.24"/>
+</g>
+<!-- 133975083685520&#45;&gt;133975085212112 -->
+<g id="edge1" class="edge">
+<title>133975083685520&#45;&gt;133975085212112</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M82,-219.81C82,-211.52 82,-201.39 82,-192.16"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="84.8,-192.02 82,-184.02 79.2,-192.02 84.8,-192.02"/>
+</g>
+<!-- 133975083685760 -->
+<g id="node5" class="node">
+<title>133975083685760</title>
+<polygon fill="aliceblue" stroke="skyblue" points="187,-184 133,-184 133,-146 187,-146 187,-184"/>
+<text text-anchor="middle" x="160" y="-168.8" font-family="Sans-Serif" font-size="14.00">p</text>
+<text text-anchor="middle" x="160" y="-153.8" font-family="Sans-Serif" font-size="14.00">(3, 5)</text>
+</g>
+<!-- 133975083686048 -->
+<g id="node6" class="node">
+<title>133975083686048</title>
+<polygon fill="honeydew" stroke="darkseagreen" points="242,-330 170,-330 170,-292 242,-292 242,-330"/>
+<text text-anchor="middle" x="206" y="-314.8" font-family="Sans-Serif" font-size="14.00">vector_2</text>
+<text text-anchor="middle" x="206" y="-299.8" font-family="Sans-Serif" font-size="14.00">[1]</text>
+</g>
+<!-- 133975083686048&#45;&gt;133975083686096 -->
+<g id="edge6" class="edge">
+<title>133975083686048&#45;&gt;133975083686096</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M194.15,-291.72C188.47,-282.94 181.58,-272.31 175.49,-262.91"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="177.72,-261.19 171.02,-256 173.02,-264.24 177.72,-261.19"/>
+</g>
+<!-- 133975083686096&#45;&gt;133975083685760 -->
+<g id="edge4" class="edge">
+<title>133975083686096&#45;&gt;133975083685760</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M160,-219.81C160,-211.52 160,-201.39 160,-192.16"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="162.8,-192.02 160,-184.02 157.2,-192.02 162.8,-192.02"/>
+</g>
+<!-- 133977343199120 -->
+<g id="node8" class="node">
+<title>133977343199120</title>
+<polygon fill="aliceblue" stroke="skyblue" points="357,-184 295,-184 295,-146 357,-146 357,-184"/>
+<text text-anchor="middle" x="326" y="-168.8" font-family="Sans-Serif" font-size="14.00">t1</text>
+<text text-anchor="middle" x="326" y="-153.8" font-family="Sans-Serif" font-size="14.00">(4, 5, 6)</text>
+</g>
+<!-- 133975083686576 -->
+<g id="node13" class="node">
+<title>133975083686576</title>
+<polygon fill="lightgray" stroke="darkslategray" points="310,-110 256,-110 256,-74 310,-74 310,-110"/>
+<text text-anchor="middle" x="283" y="-88.3" font-family="Courier Bold" font-size="14.00">sum</text>
+</g>
+<!-- 133977343199120&#45;&gt;133975083686576 -->
+<g id="edge10" class="edge">
+<title>133977343199120&#45;&gt;133975083686576</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M314.93,-145.72C309.61,-136.94 303.18,-126.31 297.48,-116.91"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="299.84,-115.4 293.3,-110 295.05,-118.3 299.84,-115.4"/>
+</g>
+<!-- 133975083686528 -->
+<g id="node9" class="node">
+<title>133975083686528</title>
+<polygon fill="lightgray" stroke="darkslategray" points="367.5,-256 284.5,-256 284.5,-220 367.5,-220 367.5,-256"/>
+<text text-anchor="middle" x="326" y="-234.3" font-family="Courier Bold" font-size="14.00">constant</text>
+</g>
+<!-- 133975083686528&#45;&gt;133977343199120 -->
+<g id="edge7" class="edge">
+<title>133975083686528&#45;&gt;133977343199120</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M326,-219.81C326,-211.52 326,-201.39 326,-192.16"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="328.8,-192.02 326,-184.02 323.2,-192.02 328.8,-192.02"/>
+</g>
+<!-- 133975083686288 -->
+<g id="node10" class="node">
+<title>133975083686288</title>
+<polygon fill="moccasin" stroke="orange" points="353,-330 299,-330 299,-292 353,-292 353,-330"/>
+<text text-anchor="middle" x="326" y="-314.8" font-family="Sans-Serif" font-size="14.00">var_1</text>
+<text text-anchor="middle" x="326" y="-299.8" font-family="Sans-Serif" font-size="14.00">1</text>
+</g>
+<!-- 133975083686288&#45;&gt;133975083686528 -->
+<g id="edge8" class="edge">
+<title>133975083686288&#45;&gt;133975083686528</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M326,-291.72C326,-283.29 326,-273.15 326,-264.02"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="328.8,-264 326,-256 323.2,-264 328.8,-264"/>
+</g>
+<!-- 133975083686240 -->
+<g id="node11" class="node">
+<title>133975083686240</title>
+<polygon fill="aliceblue" stroke="skyblue" points="310,-38 256,-38 256,0 310,0 310,-38"/>
+<text text-anchor="middle" x="283" y="-22.8" font-family="Sans-Serif" font-size="14.00">t2</text>
+<text text-anchor="middle" x="283" y="-7.8" font-family="Sans-Serif" font-size="14.00">(6,)</text>
+</g>
+<!-- 133975083686768 -->
+<g id="node12" class="node">
+<title>133975083686768</title>
+<polygon fill="honeydew" stroke="darkseagreen" points="277,-184 205,-184 205,-146 277,-146 277,-184"/>
+<text text-anchor="middle" x="241" y="-168.8" font-family="Sans-Serif" font-size="14.00">vector_3</text>
+<text text-anchor="middle" x="241" y="-153.8" font-family="Sans-Serif" font-size="14.00">[0, 1]</text>
+</g>
+<!-- 133975083686768&#45;&gt;133975083686576 -->
+<g id="edge11" class="edge">
+<title>133975083686768&#45;&gt;133975083686576</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M251.82,-145.72C257.01,-136.94 263.29,-126.31 268.86,-116.91"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="271.28,-118.31 272.94,-110 266.46,-115.46 271.28,-118.31"/>
+</g>
+<!-- 133975083686576&#45;&gt;133975083686240 -->
+<g id="edge9" class="edge">
+<title>133975083686576&#45;&gt;133975083686240</title>
+<path fill="none" stroke="#666666" stroke-width="1.2" d="M283,-73.81C283,-65.52 283,-55.39 283,-46.16"/>
+<polygon fill="#666666" stroke="#666666" stroke-width="1.2" points="285.8,-46.02 283,-38.02 280.2,-46.02 285.8,-46.02"/>
+</g>
+</g>
+</svg>
diff --git a/front/py/examples/2_ir/5_reduce_sum.py b/front/py/examples/2_ir/5_reduce_sumprod.py
similarity index 63%
rename from front/py/examples/2_ir/5_reduce_sum.py
rename to front/py/examples/2_ir/5_reduce_sumprod.py
index 30698b97..eea1e71b 100644
--- a/front/py/examples/2_ir/5_reduce_sum.py
+++ b/front/py/examples/2_ir/5_reduce_sumprod.py
@@ -1,13 +1,14 @@
 ############-------PyTorch-------################
 
 import torch
-torch_t = torch.empty(3, 4, 5).uniform_(-1, 1)
+torch_t = torch.arange(0,60).reshape(3,4,5)
 print(torch_t)
 torch_s = torch.sum(torch_t, dim=[0, 2])
 print(torch_s)
+torch_p=torch.prod(torch_t,dim=1)
+print(torch_p)
 
-
-torch_t1 = torch.ones(4, 5, 6)
+torch_t1 = torch.ones(4, 5, 6,dtype=torch.float)
 print(torch_t1)
 torch_t2 = torch.sum(torch_t1, dim=[0, 1])
 print(torch_t2)
@@ -16,18 +17,25 @@
 ############-------DEEPX-------################
 
 from deepx import Tensor,ones,zeros,arange
-from deepx.nn.functional import sum,mean
+from deepx.nn.functional import sum,prod
 
 t=Tensor(shape=(3,4,5))
 t.addtograph("t")
-t.uniform_(low=-1,high=1)
-print((t))
+t.arange_(0,1)
+t.set_format("%.0f")
+print(t)
 s=sum(t,dim=[0,2],out="s")
+s.set_format("%.0f")
 print(s)
+p=prod(t,dim=[1],out="p")
+p.set_format("%.0f")
+print(p)
 
 t1=ones(4,5,6,name="t1")
+t1.set_format("%.0f")
 print(t1)
 t2=sum(t1,dim=[0,1],out='t2')
+t2.set_format("%.0f")
 print(t2)