InfiniTensor
diff --git a/src/infiniop/elementwise/binary.h b/src/infiniop/elementwise/binary.h
Lines changed: 1 addition & 1 deletion
diff --git a/src/infiniop/elementwise/cpu/elementwise_cpu_impl.h b/src/infiniop/elementwise/cpu/elementwise_cpu_impl.h
Lines changed: 131 additions & 0 deletions
diff --git a/src/infiniop/elementwise/unary.h b/src/infiniop/elementwise/unary.h
Lines changed: 1 addition & 1 deletion
diff --git a/src/infiniop/ops/abs/cpu/abs_cpu.cc b/src/infiniop/ops/abs/cpu/abs_cpu.cc
Lines changed: 2 additions & 42 deletions
diff --git a/src/infiniop/ops/acos/cpu/acos_cpu.cc b/src/infiniop/ops/acos/cpu/acos_cpu.cc
Lines changed: 2 additions & 42 deletions
diff --git a/src/infiniop/ops/acosh/cpu/acosh_cpu.cc b/src/infiniop/ops/acosh/cpu/acosh_cpu.cc
Lines changed: 2 additions & 42 deletions
diff --git a/src/infiniop/ops/asin/cpu/asin_cpu.cc b/src/infiniop/ops/asin/cpu/asin_cpu.cc
Lines changed: 2 additions & 42 deletions
@@ -227,7 +227,7 @@ struct BinaryOp {
     ELEMENTWISE_DESCRIPTOR(OP, NAMESPACE)                                     \
                                                                               \
     namespace op::OP::NAMESPACE {                                             \
-    using Op = op::elementwise::binary::BinaryOp<MODE>; \
+    using Op = op::elementwise::binary::BinaryOp<MODE>;                       \
     }
 
 /**
 
@@ -0,0 +1,131 @@
+#ifndef __INFINIOP_ELEMENTWISE_CPU_IMPL_H__
+#define __INFINIOP_ELEMENTWISE_CPU_IMPL_H__
+
+#include "elementwise_cpu.h"
+#include "../../devices/cpu/common_cpu.h"
+#include "../../../utils/check.h"
+#include "../../../utils/result.hpp"
+
+/**
+ * @brief Generic implementation for elementwise CPU operators.
+ *
+ * This file provides two macros that generate the CPU Descriptor methods
+ * (destructor, create, calculate) for binary and unary F16/F32 operators.
+ *
+ * Usage:
+ *   #include "elementwise_cpu_impl.h"
+ *   namespace op::pow::cpu {
+ *       using Op = op::elementwise::binary::BinaryOp<BinaryMode::Pow>;
+ *       ELEMENTWISE_CPU_IMPL_BINARY(pow)
+ *   }
+ *
+ *   namespace op::sqrt::cpu {
+ *       using Op = op::elementwise::unary::UnaryOp<UnaryMode::Sqrt>;
+ *       ELEMENTWISE_CPU_IMPL_UNARY(sqrt)
+ *   }
+ */
+
+
+/**
+ * @brief Define Descriptor::~Descriptor(), create() and calculate() for a binary op.
+ * @details Expand inside the op's CPU namespace, where `Descriptor` and `Op` must be
+ * visible; OP itself is not referenced by the expansion. create() applies CHECK_DTYPE
+ * (F16/F32) to the output dtype and CHECK_SAME_SHAPE to out/a/b; input_desc_vec.at()
+ * throws std::out_of_range if fewer than two inputs are passed. calculate() dispatches
+ * on _dtype and never reads workspace or workspace_size. Usage:
+ *   namespace op::pow::cpu {
+ *       using Op = op::elementwise::binary::BinaryOp<BinaryMode::Pow>;
+ *       ELEMENTWISE_CPU_IMPL_BINARY(pow)
+ *   }
+ */
+#define ELEMENTWISE_CPU_IMPL_BINARY(OP)                                          \
+                                                                                \
+    Descriptor::~Descriptor() = default;                                        \
+                                                                                \
+    infiniStatus_t Descriptor::create(                                           \
+        infiniopHandle_t handle_,                                                \
+        Descriptor **desc_ptr,                                                   \
+        infiniopTensorDescriptor_t out_desc,                                     \
+        std::vector<infiniopTensorDescriptor_t> input_desc_vec) {                \
+        auto handle = reinterpret_cast<device::cpu::Handle *>(handle_);         \
+        auto dtype = out_desc->dtype();                                         \
+        const auto &a_desc = input_desc_vec.at(0);                               \
+        const auto &b_desc = input_desc_vec.at(1);                               \
+        const auto &out_shape = out_desc->shape();                               \
+        const auto &a_shape = a_desc->shape();                                  \
+        const auto &b_shape = b_desc->shape();                                    \
+        CHECK_DTYPE(dtype, INFINI_DTYPE_F16, INFINI_DTYPE_F32);                  \
+        CHECK_SAME_SHAPE(out_shape, a_shape, b_shape);                          \
+        CREATE_ELEMENTWISE_CPU_DESCRIPTOR(handle, dtype, out_desc, input_desc_vec); \
+        return INFINI_STATUS_SUCCESS;                                            \
+    }                                                                           \
+                                                                                \
+    infiniStatus_t Descriptor::calculate(                                        \
+        void *workspace,                                                         \
+        size_t workspace_size,                                                  \
+        void *output,                                                            \
+        std::vector<const void *> inputs,                                        \
+        void *stream) const {                                                    \
+        switch (_dtype) {                                                       \
+        case INFINI_DTYPE_F16:                                                  \
+            return _device_info->template calculate<Op, fp16_t>(                \
+                _info, output, inputs, stream);                                 \
+        case INFINI_DTYPE_F32:                                                  \
+            return _device_info->template calculate<Op, float>(                 \
+                _info, output, inputs, stream);                                  \
+        default:                                                                 \
+            return INFINI_STATUS_BAD_TENSOR_DTYPE;                              \
+        }                                                                       \
+    }
+
+/**
+ * @brief Define Descriptor::~Descriptor(), create() and calculate() for a unary op.
+ * @details Expand inside the op's CPU namespace, where `Descriptor` and `Op` must be
+ * visible; OP itself is not referenced by the expansion. create() applies CHECK_DTYPE
+ * (F16/F32) to the output dtype and CHECK_SAME_SHAPE to out/x; input_desc_vec.at(0)
+ * throws std::out_of_range on an empty input list. calculate() dispatches on _dtype
+ * and never reads workspace or workspace_size. Usage:
+ *   namespace op::sqrt::cpu {
+ *       using Op = op::elementwise::unary::UnaryOp<UnaryMode::Sqrt>;
+ *       ELEMENTWISE_CPU_IMPL_UNARY(sqrt)
+ *   }
+ */
+#define ELEMENTWISE_CPU_IMPL_UNARY(OP)                                           \
+                                                                                \
+    Descriptor::~Descriptor() = default;                                        \
+                                                                                \
+    infiniStatus_t Descriptor::create(                                           \
+        infiniopHandle_t handle_,                                                \
+        Descriptor **desc_ptr,                                                   \
+        infiniopTensorDescriptor_t out_desc,                                     \
+        std::vector<infiniopTensorDescriptor_t> input_desc_vec) {                \
+        auto handle = reinterpret_cast<device::cpu::Handle *>(handle_);         \
+        auto dtype = out_desc->dtype();                                         \
+        const auto &x_desc = input_desc_vec.at(0);                               \
+        const auto &y_shape = out_desc->shape();                                 \
+        const auto &x_shape = x_desc->shape();                                   \
+        CHECK_DTYPE(dtype, INFINI_DTYPE_F16, INFINI_DTYPE_F32);                  \
+        CHECK_SAME_SHAPE(y_shape, x_shape);                                      \
+        CREATE_ELEMENTWISE_CPU_DESCRIPTOR(handle, dtype, out_desc, input_desc_vec); \
+        return INFINI_STATUS_SUCCESS;                                            \
+    }                                                                           \
+                                                                                \
+    infiniStatus_t Descriptor::calculate(                                        \
+        void *workspace,                                                         \
+        size_t workspace_size,                                                  \
+        void *output,                                                            \
+        std::vector<const void *> inputs,                                        \
+        void *stream) const {                                                    \
+        switch (_dtype) {                                                       \
+        case INFINI_DTYPE_F16:                                                  \
+            return _device_info->template calculate<Op, fp16_t>(                \
+                _info, output, inputs, stream);                                 \
+        case INFINI_DTYPE_F32:                                                  \
+            return _device_info->template calculate<Op, float>(                 \
+                _info, output, inputs, stream);                                  \
+        default:                                                                 \
+            return INFINI_STATUS_BAD_TENSOR_DTYPE;                              \
+        }                                                                       \
+    }
+
+#endif // __INFINIOP_ELEMENTWISE_CPU_IMPL_H__
@@ -508,7 +508,7 @@ struct UnaryOp {
     ELEMENTWISE_DESCRIPTOR(OP, NAMESPACE)                                     \
                                                                               \
     namespace op::OP::NAMESPACE {                                             \
-    using Op = op::elementwise::unary::UnaryOp<MODE>; \
+    using Op = op::elementwise::unary::UnaryOp<MODE>;                         \
     }
 
 } // namespace op::elementwise::unary
 
@@ -1,48 +1,8 @@
 #include "abs_cpu.h"
+#include "../../../elementwise/cpu/elementwise_cpu_impl.h"
 
 namespace op::abs::cpu {
 
-Descriptor::~Descriptor() = default;
+ELEMENTWISE_CPU_IMPL_UNARY(abs)
 
-infiniStatus_t Descriptor::create(
-    infiniopHandle_t handle_,
-    Descriptor **desc_ptr,
-    infiniopTensorDescriptor_t out_desc,
-    std::vector<infiniopTensorDescriptor_t> input_desc_vec) {
-
-    auto handle = reinterpret_cast<device::cpu::Handle *>(handle_);
-    auto dtype = out_desc->dtype();
-
-    const auto &x_desc = input_desc_vec.at(0);
-    const auto &y_shape = out_desc->shape();
-    const auto &x_shape = x_desc->shape();
-
-    CHECK_DTYPE(dtype, INFINI_DTYPE_F16, INFINI_DTYPE_F32);
-
-    CHECK_SAME_SHAPE(y_shape, x_shape);
-
-    // create CPU elementwise descriptor
-    CREATE_ELEMENTWISE_CPU_DESCRIPTOR(handle, dtype, out_desc, input_desc_vec);
-
-    return INFINI_STATUS_SUCCESS;
-}
-
-infiniStatus_t Descriptor::calculate(
-    void *workspace,
-    size_t workspace_size,
-    void *output,
-    std::vector<const void *> inputs,
-    void *stream) const {
-
-    switch (_dtype) {
-    case INFINI_DTYPE_F16:
-        return _device_info->calculate<Op, fp16_t>(_info, output, inputs, stream);
-    case INFINI_DTYPE_F32:
-        return _device_info->calculate<Op, float>(_info, output, inputs, stream);
-    default:
-        return INFINI_STATUS_BAD_TENSOR_DTYPE;
-    }
-
-    return INFINI_STATUS_SUCCESS;
-}
 } // namespace op::abs::cpu
@@ -1,48 +1,8 @@
 #include "acos_cpu.h"
+#include "../../../elementwise/cpu/elementwise_cpu_impl.h"
 
 namespace op::acos::cpu {
 
-Descriptor::~Descriptor() = default;
+ELEMENTWISE_CPU_IMPL_UNARY(acos)
 
-infiniStatus_t Descriptor::create(
-    infiniopHandle_t handle_,
-    Descriptor **desc_ptr,
-    infiniopTensorDescriptor_t out_desc,
-    std::vector<infiniopTensorDescriptor_t> input_desc_vec) {
-
-    auto handle = reinterpret_cast<device::cpu::Handle *>(handle_);
-    auto dtype = out_desc->dtype();
-
-    const auto &x_desc = input_desc_vec.at(0);
-    const auto &y_shape = out_desc->shape();
-    const auto &x_shape = x_desc->shape();
-
-    CHECK_DTYPE(dtype, INFINI_DTYPE_F16, INFINI_DTYPE_F32);
-
-    CHECK_SAME_SHAPE(y_shape, x_shape);
-
-    // create CPU elementwise descriptor
-    CREATE_ELEMENTWISE_CPU_DESCRIPTOR(handle, dtype, out_desc, input_desc_vec);
-
-    return INFINI_STATUS_SUCCESS;
-}
-
-infiniStatus_t Descriptor::calculate(
-    void *workspace,
-    size_t workspace_size,
-    void *output,
-    std::vector<const void *> inputs,
-    void *stream) const {
-
-    switch (_dtype) {
-    case INFINI_DTYPE_F16:
-        return _device_info->calculate<Op, fp16_t>(_info, output, inputs, stream);
-    case INFINI_DTYPE_F32:
-        return _device_info->calculate<Op, float>(_info, output, inputs, stream);
-    default:
-        return INFINI_STATUS_BAD_TENSOR_DTYPE;
-    }
-
-    return INFINI_STATUS_SUCCESS;
-}
 } // namespace op::acos::cpu
@@ -1,48 +1,8 @@
 #include "acosh_cpu.h"
+#include "../../../elementwise/cpu/elementwise_cpu_impl.h"
 
 namespace op::acosh::cpu {
 
-Descriptor::~Descriptor() = default;
+ELEMENTWISE_CPU_IMPL_UNARY(acosh)
 
-infiniStatus_t Descriptor::create(
-    infiniopHandle_t handle_,
-    Descriptor **desc_ptr,
-    infiniopTensorDescriptor_t out_desc,
-    std::vector<infiniopTensorDescriptor_t> input_desc_vec) {
-
-    auto handle = reinterpret_cast<device::cpu::Handle *>(handle_);
-    auto dtype = out_desc->dtype();
-
-    const auto &x_desc = input_desc_vec.at(0);
-    const auto &y_shape = out_desc->shape();
-    const auto &x_shape = x_desc->shape();
-
-    CHECK_DTYPE(dtype, INFINI_DTYPE_F16, INFINI_DTYPE_F32);
-
-    CHECK_SAME_SHAPE(y_shape, x_shape);
-
-    // create CPU elementwise descriptor
-    CREATE_ELEMENTWISE_CPU_DESCRIPTOR(handle, dtype, out_desc, input_desc_vec);
-
-    return INFINI_STATUS_SUCCESS;
-}
-
-infiniStatus_t Descriptor::calculate(
-    void *workspace,
-    size_t workspace_size,
-    void *output,
-    std::vector<const void *> inputs,
-    void *stream) const {
-
-    switch (_dtype) {
-    case INFINI_DTYPE_F16:
-        return _device_info->calculate<Op, fp16_t>(_info, output, inputs, stream);
-    case INFINI_DTYPE_F32:
-        return _device_info->calculate<Op, float>(_info, output, inputs, stream);
-    default:
-        return INFINI_STATUS_BAD_TENSOR_DTYPE;
-    }
-
-    return INFINI_STATUS_SUCCESS;
-}
 } // namespace op::acosh::cpu
@@ -1,48 +1,8 @@
 #include "asin_cpu.h"
+#include "../../../elementwise/cpu/elementwise_cpu_impl.h"
 
 namespace op::asin::cpu {
 
-Descriptor::~Descriptor() = default;
+ELEMENTWISE_CPU_IMPL_UNARY(asin)
 
-infiniStatus_t Descriptor::create(
-    infiniopHandle_t handle_,
-    Descriptor **desc_ptr,
-    infiniopTensorDescriptor_t out_desc,
-    std::vector<infiniopTensorDescriptor_t> input_desc_vec) {
-
-    auto handle = reinterpret_cast<device::cpu::Handle *>(handle_);
-    auto dtype = out_desc->dtype();
-
-    const auto &x_desc = input_desc_vec.at(0);
-    const auto &y_shape = out_desc->shape();
-    const auto &x_shape = x_desc->shape();
-
-    CHECK_DTYPE(dtype, INFINI_DTYPE_F16, INFINI_DTYPE_F32);
-
-    CHECK_SAME_SHAPE(y_shape, x_shape);
-
-    // create CPU elementwise descriptor
-    CREATE_ELEMENTWISE_CPU_DESCRIPTOR(handle, dtype, out_desc, input_desc_vec);
-
-    return INFINI_STATUS_SUCCESS;
-}
-
-infiniStatus_t Descriptor::calculate(
-    void *workspace,
-    size_t workspace_size,
-    void *output,
-    std::vector<const void *> inputs,
-    void *stream) const {
-
-    switch (_dtype) {
-    case INFINI_DTYPE_F16:
-        return _device_info->calculate<Op, fp16_t>(_info, output, inputs, stream);
-    case INFINI_DTYPE_F32:
-        return _device_info->calculate<Op, float>(_info, output, inputs, stream);
-    default:
-        return INFINI_STATUS_BAD_TENSOR_DTYPE;
-    }
-
-    return INFINI_STATUS_SUCCESS;
-}
 } // namespace op::asin::cpu
Original file line number	Diff line number	Diff line change
`@@ -227,7 +227,7 @@ struct BinaryOp {`
`227`	`227`	`ELEMENTWISE_DESCRIPTOR(OP, NAMESPACE) \`
`228`	`228`	`\`
`229`	`229`	`namespace op::OP::NAMESPACE { \`
`230`		`- using Op = op::elementwise::binary::BinaryOp<MODE>; \`
	`230`	`+ using Op = op::elementwise::binary::BinaryOp<MODE>; \`
`231`	`231`	`}`
`232`	`232`
`233`	`233`	`/**`
Original file line number	Diff line number	Diff line change
`@@ -508,7 +508,7 @@ struct UnaryOp {`
`508`	`508`	`ELEMENTWISE_DESCRIPTOR(OP, NAMESPACE) \`
`509`	`509`	`\`
`510`	`510`	`namespace op::OP::NAMESPACE { \`
`511`		`- using Op = op::elementwise::unary::UnaryOp<MODE>; \`
	`511`	`+ using Op = op::elementwise::unary::UnaryOp<MODE>; \`
`512`	`512`	`}`
`513`	`513`
`514`	`514`	`} // namespace op::elementwise::unary`