forked from jiuyuan/InfiniTensor
7f16fa353e
feat: Add Gelu kernel, operator, ffi. |
||
---|---|---|
.. | ||
cuda_clip.h | ||
cuda_common.h | ||
cuda_element_wise.h | ||
cuda_expand.h | ||
cuda_kernel_wihtout_config.h | ||
cuda_pad_slice.h | ||
cuda_runtime.h | ||
cuda_split_concat.h | ||
cuda_transpose.h | ||
cuda_unary.h | ||
cuda_utility.h | ||
cuda_where.h | ||
gather.h | ||
gbmm_g2bmm.cuh | ||
gbmm_g2bmm.h | ||
nccl_communicator.h | ||
operator_timer.h | ||
resize.cuh | ||
softmax.h |