Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 9 additions & 0 deletions include/infiniop.h
Original file line number Diff line number Diff line change
Expand Up @@ -4,18 +4,27 @@
#include "infiniop/handle.h"
#include "infiniop/ops/add.h"
#include "infiniop/ops/attention.h"
#include "infiniop/ops/cast.h"
#include "infiniop/ops/causal_softmax.h"
#include "infiniop/ops/clip.h"
#include "infiniop/ops/conv.h"
#include "infiniop/ops/cos.h"
#include "infiniop/ops/exp.h"
#include "infiniop/ops/gemm.h"
#include "infiniop/ops/hard_swish.h"
#include "infiniop/ops/leaky_relu.h"
#include "infiniop/ops/mul.h"
#include "infiniop/ops/random_sample.h"
#include "infiniop/ops/rearrange.h"
#include "infiniop/ops/relu.h"
#include "infiniop/ops/rms_norm.h"
#include "infiniop/ops/rope.h"
#include "infiniop/ops/sigmoid_backward.h"
#include "infiniop/ops/sub.h"
#include "infiniop/ops/swiglu.h"
#include "infiniop/tensor_descriptor.h"
#include "infiniop/ops/tanh.h"
#include "infiniop/ops/sin.h"
#include "infiniop/ops/where.h"

#endif // __INFINIOP_API_H__
24 changes: 24 additions & 0 deletions include/infiniop/ops/cast.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,24 @@
#ifndef __INFINIOP_CAST_API_H__
#define __INFINIOP_CAST_API_H__

#include "../operator_descriptor.h"

/// Handle type for a Cast operator descriptor; an alias for a pointer to
/// `struct InfiniopDescriptor`.
typedef struct InfiniopDescriptor *infiniopCastDescriptor_t;

/// @brief Create a Cast operator descriptor.
/// @param handle   Library handle the descriptor is created against.
/// @param desc_ptr Out-parameter for the new descriptor.
/// @param output   Tensor descriptor of the result.
/// @param input    Tensor descriptor of the source.
/// @return An infiniStatus_t status code.
/// NOTE(review): no dtype argument is taken, so presumably the source and
/// target element types come from the two tensor descriptors - confirm.
__C __export infiniStatus_t infiniopCreateCastDescriptor(infiniopHandle_t handle,
infiniopCastDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output,
infiniopTensorDescriptor_t input);

/// @brief Query the workspace size associated with a Cast descriptor.
/// @param desc Descriptor to query.
/// @param size Out-parameter for the size (presumably in bytes - confirm).
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopGetCastWorkspaceSize(infiniopCastDescriptor_t desc, size_t *size);

/// @brief Run the Cast operator.
/// @param desc           Cast descriptor (presumably one obtained from
///                       infiniopCreateCastDescriptor).
/// @param workspace      Scratch buffer.
/// @param workspace_size Size of `workspace`.
/// @param output         Destination data pointer.
/// @param input          Source data pointer (read-only).
/// @param stream         Opaque stream handle. NOTE(review): its meaning is
///                       backend-specific and not visible here - confirm.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopCast(infiniopCastDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *output,
const void *input,
void *stream);

/// @brief Destroy a Cast descriptor.
/// @param desc Descriptor to destroy.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopDestroyCastDescriptor(infiniopCastDescriptor_t desc);

#endif
24 changes: 24 additions & 0 deletions include/infiniop/ops/cos.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,24 @@
#ifndef __INFINIOP_COS_API_H__
#define __INFINIOP_COS_API_H__

#include "../operator_descriptor.h"

/// Handle type for a Cos operator descriptor; an alias for a pointer to
/// `struct InfiniopDescriptor`.
typedef struct InfiniopDescriptor *infiniopCosDescriptor_t;

/// @brief Create a Cos operator descriptor.
/// @param handle   Library handle the descriptor is created against.
/// @param desc_ptr Out-parameter for the new descriptor.
/// @param output   Tensor descriptor of the result.
/// @param input    Tensor descriptor of the operand.
/// @return An infiniStatus_t status code.
/// NOTE(review): presumably an element-wise cosine - confirm against the
/// implementation.
__C __export infiniStatus_t infiniopCreateCosDescriptor(infiniopHandle_t handle,
infiniopCosDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output,
infiniopTensorDescriptor_t input);

/// @brief Query the workspace size associated with a Cos descriptor.
/// @param desc Descriptor to query.
/// @param size Out-parameter for the size (presumably in bytes - confirm).
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopGetCosWorkspaceSize(infiniopCosDescriptor_t desc, size_t *size);

/// @brief Run the Cos operator.
/// @param desc           Cos descriptor (presumably one obtained from
///                       infiniopCreateCosDescriptor).
/// @param workspace      Scratch buffer.
/// @param workspace_size Size of `workspace`.
/// @param output         Destination data pointer.
/// @param input          Source data pointer (read-only).
/// @param stream         Opaque stream handle. NOTE(review): its meaning is
///                       backend-specific and not visible here - confirm.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopCos(infiniopCosDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *output,
const void *input,
void *stream);

/// @brief Destroy a Cos descriptor.
/// @param desc Descriptor to destroy.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopDestroyCosDescriptor(infiniopCosDescriptor_t desc);

#endif
24 changes: 24 additions & 0 deletions include/infiniop/ops/exp.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,24 @@
#ifndef __INFINIOP_EXP_API_H__
#define __INFINIOP_EXP_API_H__

#include "../operator_descriptor.h"

/// Handle type for an Exp operator descriptor; an alias for a pointer to
/// `struct InfiniopDescriptor`.
typedef struct InfiniopDescriptor *infiniopExpDescriptor_t;

/// @brief Create an Exp operator descriptor.
/// @param handle   Library handle the descriptor is created against.
/// @param desc_ptr Out-parameter for the new descriptor.
/// @param output   Tensor descriptor of the result.
/// @param input    Tensor descriptor of the operand.
/// @return An infiniStatus_t status code.
/// NOTE(review): presumably an element-wise natural exponential - confirm
/// against the implementation.
__C __export infiniStatus_t infiniopCreateExpDescriptor(infiniopHandle_t handle,
infiniopExpDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output,
infiniopTensorDescriptor_t input);

/// @brief Query the workspace size associated with an Exp descriptor.
/// @param desc Descriptor to query.
/// @param size Out-parameter for the size (presumably in bytes - confirm).
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopGetExpWorkspaceSize(infiniopExpDescriptor_t desc, size_t *size);

/// @brief Run the Exp operator.
/// @param desc           Exp descriptor (presumably one obtained from
///                       infiniopCreateExpDescriptor).
/// @param workspace      Scratch buffer.
/// @param workspace_size Size of `workspace`.
/// @param output         Destination data pointer.
/// @param input          Source data pointer (read-only).
/// @param stream         Opaque stream handle. NOTE(review): its meaning is
///                       backend-specific and not visible here - confirm.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopExp(infiniopExpDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *output,
const void *input,
void *stream);

/// @brief Destroy an Exp descriptor.
/// @param desc Descriptor to destroy.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopDestroyExpDescriptor(infiniopExpDescriptor_t desc);

#endif
24 changes: 24 additions & 0 deletions include/infiniop/ops/hard_swish.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,24 @@
#ifndef __INFINIOP_HARD_SWISH_API_H__
#define __INFINIOP_HARD_SWISH_API_H__

#include "../operator_descriptor.h"

/// Handle type for a HardSwish operator descriptor; an alias for a pointer to
/// `struct InfiniopDescriptor`.
typedef struct InfiniopDescriptor *infiniopHardSwishDescriptor_t;

/// @brief Create a HardSwish operator descriptor.
/// @param handle   Library handle the descriptor is created against.
/// @param desc_ptr Out-parameter for the new descriptor.
/// @param output   Tensor descriptor of the result.
/// @param input    Tensor descriptor of the operand.
/// @return An infiniStatus_t status code.
/// NOTE(review): presumably the element-wise activation
/// x * relu6(x + 3) / 6 - confirm the exact formula in the implementation.
__C __export infiniStatus_t infiniopCreateHardSwishDescriptor(infiniopHandle_t handle,
infiniopHardSwishDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output,
infiniopTensorDescriptor_t input);

/// @brief Query the workspace size associated with a HardSwish descriptor.
/// @param desc Descriptor to query.
/// @param size Out-parameter for the size (presumably in bytes - confirm).
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopGetHardSwishWorkspaceSize(infiniopHardSwishDescriptor_t desc, size_t *size);

/// @brief Run the HardSwish operator.
/// @param desc           HardSwish descriptor (presumably one obtained from
///                       infiniopCreateHardSwishDescriptor).
/// @param workspace      Scratch buffer.
/// @param workspace_size Size of `workspace`.
/// @param output         Destination data pointer.
/// @param input          Source data pointer (read-only).
/// @param stream         Opaque stream handle. NOTE(review): its meaning is
///                       backend-specific and not visible here - confirm.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopHardSwish(infiniopHardSwishDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *output,
const void *input,
void *stream);

/// @brief Destroy a HardSwish descriptor.
/// @param desc Descriptor to destroy.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopDestroyHardSwishDescriptor(infiniopHardSwishDescriptor_t desc);

#endif
39 changes: 39 additions & 0 deletions include/infiniop/ops/leaky_relu.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,39 @@
#ifndef __INFINIOP_LEAKY_RELU_API_H__
#define __INFINIOP_LEAKY_RELU_API_H__

#include "../operator_descriptor.h"

/// Handle type for a LeakyReLU operator descriptor; an alias for a pointer to
/// `struct InfiniopDescriptor`.
typedef struct InfiniopDescriptor *infiniopLeakyReluDescriptor_t;

/// @brief Create a LeakyReLU descriptor.
/// @param handle Context handle.
/// @param desc_ptr Output: the operator descriptor.
/// @param output Output tensor descriptor.
/// @param input Input tensor descriptor.
/// @note The negative slope is not a creation-time parameter; it is passed
///       on each call to infiniopLeakyRelu.
__C __export infiniStatus_t infiniopCreateLeakyReluDescriptor(
infiniopHandle_t handle,
infiniopLeakyReluDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output,
infiniopTensorDescriptor_t input);

/// @brief Get the workspace size.
/// @param desc Descriptor to query.
/// @param size Out-parameter for the size (presumably in bytes - confirm).
__C __export infiniStatus_t infiniopGetLeakyReluWorkspaceSize(
infiniopLeakyReluDescriptor_t desc,
size_t *size);

/// @brief Execute the LeakyReLU operation.
/// @param desc LeakyReLU descriptor.
/// @param workspace Scratch buffer.
/// @param workspace_size Size of `workspace`.
/// @param output Destination data pointer.
/// @param input Source data pointer (read-only).
/// @param negative_slope Negative slope (alpha), as a float.
/// @param stream Opaque stream handle. NOTE(review): its meaning is
///               backend-specific and not visible here - confirm.
__C __export infiniStatus_t infiniopLeakyRelu(
infiniopLeakyReluDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *output,
const void *input,
float negative_slope,
void *stream);

/// @brief Destroy a LeakyReLU descriptor.
/// @param desc Descriptor to destroy.
__C __export infiniStatus_t infiniopDestroyLeakyReluDescriptor(
infiniopLeakyReluDescriptor_t desc);

#endif // __INFINIOP_LEAKY_RELU_API_H__
26 changes: 26 additions & 0 deletions include/infiniop/ops/sigmoid_backward.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
#ifndef __INFINIOP_SIGMOID_BACKWARD_API_H__
#define __INFINIOP_SIGMOID_BACKWARD_API_H__

#include "../operator_descriptor.h"

/// Handle type for a SigmoidBackward operator descriptor; an alias for a
/// pointer to `struct InfiniopDescriptor`.
typedef struct InfiniopDescriptor *infiniopSigmoidBackwardDescriptor_t;

/// @brief Create a SigmoidBackward operator descriptor.
/// @param handle      Library handle the descriptor is created against.
/// @param desc_ptr    Out-parameter for the new descriptor.
/// @param grad_input  Tensor descriptor of the result (the non-const data
///                    pointer in infiniopSigmoidBackward has the same name).
/// @param grad_output Tensor descriptor of the incoming gradient.
/// @param input       Tensor descriptor of the second operand.
/// @return An infiniStatus_t status code.
/// NOTE(review): presumably computes
/// grad_input = grad_output * s * (1 - s) with s = sigmoid(input). Confirm
/// this, and whether `input` is the forward input or the forward output.
__C __export infiniStatus_t infiniopCreateSigmoidBackwardDescriptor(infiniopHandle_t handle,
infiniopSigmoidBackwardDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t grad_input,
infiniopTensorDescriptor_t grad_output,
infiniopTensorDescriptor_t input);

/// @brief Query the workspace size associated with a SigmoidBackward descriptor.
/// @param desc Descriptor to query.
/// @param size Out-parameter for the size (presumably in bytes - confirm).
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopGetSigmoidBackwardWorkspaceSize(infiniopSigmoidBackwardDescriptor_t desc, size_t *size);

/// @brief Run the SigmoidBackward operator.
/// @param desc           SigmoidBackward descriptor (presumably one obtained
///                       from infiniopCreateSigmoidBackwardDescriptor).
/// @param workspace      Scratch buffer.
/// @param workspace_size Size of `workspace`.
/// @param grad_input     Destination data pointer.
/// @param grad_output    Incoming-gradient data pointer (read-only).
/// @param input          Second operand data pointer (read-only).
/// @param stream         Opaque stream handle. NOTE(review): its meaning is
///                       backend-specific and not visible here - confirm.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopSigmoidBackward(infiniopSigmoidBackwardDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *grad_input,
const void *grad_output,
const void *input,
void *stream);

/// @brief Destroy a SigmoidBackward descriptor.
/// @param desc Descriptor to destroy.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopDestroySigmoidBackwardDescriptor(infiniopSigmoidBackwardDescriptor_t desc);

#endif
24 changes: 24 additions & 0 deletions include/infiniop/ops/sin.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,24 @@
#ifndef __INFINIOP_SIN_API_H__
#define __INFINIOP_SIN_API_H__

#include "../operator_descriptor.h"

/// Handle type for a Sin operator descriptor; an alias for a pointer to
/// `struct InfiniopDescriptor`.
typedef struct InfiniopDescriptor *infiniopSinDescriptor_t;

/// @brief Create a Sin operator descriptor.
/// @param handle   Library handle the descriptor is created against.
/// @param desc_ptr Out-parameter for the new descriptor.
/// @param output   Tensor descriptor of the result.
/// @param input    Tensor descriptor of the operand.
/// @return An infiniStatus_t status code.
/// NOTE(review): presumably an element-wise sine - confirm against the
/// implementation.
__C __export infiniStatus_t infiniopCreateSinDescriptor(infiniopHandle_t handle,
infiniopSinDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output,
infiniopTensorDescriptor_t input);

/// @brief Query the workspace size associated with a Sin descriptor.
/// @param desc Descriptor to query.
/// @param size Out-parameter for the size (presumably in bytes - confirm).
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopGetSinWorkspaceSize(infiniopSinDescriptor_t desc, size_t *size);

/// @brief Run the Sin operator.
/// @param desc           Sin descriptor (presumably one obtained from
///                       infiniopCreateSinDescriptor).
/// @param workspace      Scratch buffer.
/// @param workspace_size Size of `workspace`.
/// @param output         Destination data pointer.
/// @param input          Source data pointer (read-only).
/// @param stream         Opaque stream handle. NOTE(review): its meaning is
///                       backend-specific and not visible here - confirm.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopSin(infiniopSinDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *output,
const void *input,
void *stream);

/// @brief Destroy a Sin descriptor.
/// @param desc Descriptor to destroy.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopDestroySinDescriptor(infiniopSinDescriptor_t desc);

#endif
24 changes: 24 additions & 0 deletions include/infiniop/ops/tanh.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,24 @@
#ifndef __INFINIOP_TANH_API_H__
#define __INFINIOP_TANH_API_H__

#include "../operator_descriptor.h"

/// Handle type for a Tanh operator descriptor; an alias for a pointer to
/// `struct InfiniopDescriptor`.
typedef struct InfiniopDescriptor *infiniopTanhDescriptor_t;

/// @brief Create a Tanh operator descriptor.
/// @param handle   Library handle the descriptor is created against.
/// @param desc_ptr Out-parameter for the new descriptor.
/// @param output   Tensor descriptor of the result.
/// @param input    Tensor descriptor of the operand.
/// @return An infiniStatus_t status code.
/// NOTE(review): presumably an element-wise hyperbolic tangent - confirm
/// against the implementation.
__C __export infiniStatus_t infiniopCreateTanhDescriptor(infiniopHandle_t handle,
infiniopTanhDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output,
infiniopTensorDescriptor_t input);

/// @brief Query the workspace size associated with a Tanh descriptor.
/// @param desc Descriptor to query.
/// @param size Out-parameter for the size (presumably in bytes - confirm).
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopGetTanhWorkspaceSize(infiniopTanhDescriptor_t desc, size_t *size);

/// @brief Run the Tanh operator.
/// @param desc           Tanh descriptor (presumably one obtained from
///                       infiniopCreateTanhDescriptor).
/// @param workspace      Scratch buffer.
/// @param workspace_size Size of `workspace`.
/// @param output         Destination data pointer.
/// @param input          Source data pointer (read-only).
/// @param stream         Opaque stream handle. NOTE(review): its meaning is
///                       backend-specific and not visible here - confirm.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopTanh(infiniopTanhDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *output,
const void *input,
void *stream);

/// @brief Destroy a Tanh descriptor.
/// @param desc Descriptor to destroy.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopDestroyTanhDescriptor(infiniopTanhDescriptor_t desc);

#endif
30 changes: 30 additions & 0 deletions include/infiniop/ops/where.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,30 @@
#ifndef __INFINIOP_WHERE_API_H__
#define __INFINIOP_WHERE_API_H__

#include "../operator_descriptor.h"

/// Handle type for a Where operator descriptor; an alias for a pointer to
/// `struct InfiniopDescriptor`.
typedef struct InfiniopDescriptor *infiniopWhereDescriptor_t;

/// @brief Create a Where operator descriptor.
/// @param handle         Library handle the descriptor is created against.
/// @param desc_ptr       Out-parameter for the new descriptor.
/// @param c_desc         Tensor descriptor of the result `c`.
/// @param a_desc         Tensor descriptor of operand `a`.
/// @param b_desc         Tensor descriptor of operand `b`.
/// @param condition_desc Tensor descriptor of the selection mask.
/// @return An infiniStatus_t status code.
/// NOTE(review): presumably c[i] = condition[i] ? a[i] : b[i] - confirm the
/// selection order and the expected dtype of `condition` in the implementation.
__C __export infiniStatus_t infiniopCreateWhereDescriptor(
    infiniopHandle_t handle,
    infiniopWhereDescriptor_t *desc_ptr,
    infiniopTensorDescriptor_t c_desc,
    infiniopTensorDescriptor_t a_desc,
    infiniopTensorDescriptor_t b_desc,
    infiniopTensorDescriptor_t condition_desc);

/// @brief Query the workspace size associated with a Where descriptor.
/// @param desc Descriptor to query.
/// @param size Out-parameter for the size (presumably in bytes - confirm).
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopGetWhereWorkspaceSize(
    infiniopWhereDescriptor_t desc,
    size_t *size);

/// @brief Run the Where operator.
/// @param desc           Where descriptor.
/// @param workspace      Scratch buffer.
/// @param workspace_size Size of `workspace`.
/// @param c              Destination data pointer.
/// @param a              Data pointer of operand `a` (read-only).
/// @param b              Data pointer of operand `b` (read-only).
/// @param condition      Data pointer of the selection mask (read-only).
/// @param stream         Opaque stream handle. NOTE(review): its meaning is
///                       backend-specific and not visible here - confirm.
/// @return An infiniStatus_t status code.
__C __export infiniStatus_t infiniopWhere(
    infiniopWhereDescriptor_t desc,
    void *workspace,
    size_t workspace_size,
    void *c,
    const void *a,
    const void *b,
    const void *condition,
    void *stream);

/// @brief Destroy a Where descriptor.
/// @param desc Descriptor to destroy.
/// @return An infiniStatus_t status code.
/// Declared so that users of the public API can release a descriptor obtained
/// from infiniopCreateWhereDescriptor, matching the Create/Get/Run/Destroy
/// shape of the other operator headers (e.g. infiniopDestroyCastDescriptor).
/// NOTE(review): the definition is expected in the Where operator's
/// implementation file - confirm it exists and is exported.
__C __export infiniStatus_t infiniopDestroyWhereDescriptor(
    infiniopWhereDescriptor_t desc);

#endif // __INFINIOP_WHERE_API_H__
46 changes: 46 additions & 0 deletions src/infiniop/ops/cast/cast.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,46 @@
#ifndef __CAST_H__
#define __CAST_H__

#include "../../operator.h"

/// Declares `op::cast::NAMESPACE::Descriptor`, the descriptor class of the
/// Cast operator for one backend namespace.
///
/// The generated class derives from InfiniopDescriptor and stores the output
/// and input dtypes, an `op::elementwise::ElementwiseInfo`, a uniquely-owned
/// `op::elementwise::NAMESPACE::DeviceImpl`, and the workspace size.
///
/// The constructor is private and takes ownership of the raw `device_info`
/// pointer by wrapping it in the `std::unique_ptr` member. The public surface
/// is the destructor, `workspaceSize()`, the static `create()` and
/// `calculate()`; only `workspaceSize()` is defined here, the others must be
/// defined by the backend.
///
/// The expansion needs `std::unique_ptr`, `std::vector` and the
/// `op::elementwise` types to be visible at the point of use.
/// NOTE(review): presumably `create()` is the only intended way to construct
/// a Descriptor - confirm in the backend sources.
///
/// Only `/* ... */` comments may be used inside the macro body: a `//` comment
/// would swallow the following continuation lines.
#define DESCRIPTOR(NAMESPACE) \
    namespace op::cast::NAMESPACE { \
    class Descriptor final : public InfiniopDescriptor { \
        infiniDtype_t _output_dtype; \
        infiniDtype_t _input_dtype; \
        op::elementwise::ElementwiseInfo _info; \
        std::unique_ptr<op::elementwise::NAMESPACE::DeviceImpl> _device_info; \
        size_t _workspace_size; \
        /* Parameter names deliberately differ from the members they set. */ \
        Descriptor( \
            infiniDtype_t output_dtype, \
            infiniDtype_t input_dtype, \
            op::elementwise::ElementwiseInfo info, \
            op::elementwise::NAMESPACE::DeviceImpl *device_info, \
            size_t workspace_size, \
            infiniDevice_t device_type, \
            int device_id) \
            : InfiniopDescriptor{device_type, device_id}, \
              _output_dtype(output_dtype), \
              _input_dtype(input_dtype), \
              _info(std::move(info)), \
              _device_info(device_info), \
              _workspace_size(workspace_size) {} \
    \
    public: \
        ~Descriptor(); \
        size_t workspaceSize() const { return _workspace_size; } \
        static infiniStatus_t create( \
            infiniopHandle_t handle, \
            Descriptor **desc_ptr, \
            infiniopTensorDescriptor_t output_desc, \
            std::vector<infiniopTensorDescriptor_t> input_descs); \
        infiniStatus_t calculate( \
            void *workspace, size_t workspace_size, \
            void *output, \
            std::vector<const void *> inputs, \
            void *stream) const; \
    }; \
    }


#endif

Loading