InfiniTensor/test/kernels/kunlun/test_kunlun_transpose.cc

#include "core/graph.h"
#include "core/kernel.h"
#include "core/runtime.h"
#include "kunlun/kunlun_runtime.h"
#include "operators/transpose.h"

#include "test.h"

namespace infini {

/**
 * Runs a transpose operator of type T on the Kunlun runtime and verifies the
 * result against a reference computed on the host.
 *
 * The permutation is fixed to {0, 1, 3, 2}, i.e. the last two axes of a
 * rank-4 tensor are swapped, so `shape` must have exactly four dimensions.
 *
 * @param generator Callback used to fill the Float32 input tensor.
 * @param shape     Shape of the input tensor (rank 4).
 */
template <class T>
void testTranspose(
    const std::function<void(void *, size_t, DataType)> &generator,
    const Shape &shape) {
    vector<int> permute = {0, 1, 3, 2};
    // The reference computation below indexes shape[0..3]; bail out early
    // (with a recorded failure) if the caller passes a different rank.
    EXPECT_TRUE(shape.size() == permute.size());
    if (shape.size() != permute.size()) {
        return;
    }

    // Runtime
    Runtime cpuRuntime = NativeCpuRuntimeObj::getInstance();
    auto xpuRuntime = make_ref<KUNLUNRuntimeObj>();

    // Build input data on CPU
    Tensor inputCpu = make_ref<TensorObj>(shape, DataType::Float32, cpuRuntime);
    inputCpu->dataMalloc();
    inputCpu->setData(generator);

    // Run the operator on the device graph
    Graph xpuGraph = make_ref<GraphObj>(xpuRuntime);
    auto inputGpu = xpuGraph->cloneTensor(inputCpu);
    auto gpuOp = xpuGraph->addOp<T>(inputGpu, nullptr, permute);
    xpuGraph->dataMalloc();
    xpuRuntime->run(xpuGraph);
    auto outputGpu = gpuOp->getOutput();
    auto outputGpu2Cpu = outputGpu->clone(cpuRuntime);

    // Host reference: for each of the shape[0] * shape[1] matrices, element
    // (r, c) of the input lands at (c, r) of the output.
    const size_t planes =
        static_cast<size_t>(shape[0]) * static_cast<size_t>(shape[1]);
    const size_t rows = static_cast<size_t>(shape[2]);
    const size_t cols = static_cast<size_t>(shape[3]);
    const float *src = inputCpu->getRawDataPtr<float *>();
    vector<float> expected(planes * rows * cols);
    for (size_t p = 0; p < planes; ++p) {
        for (size_t r = 0; r < rows; ++r) {
            for (size_t c = 0; c < cols; ++c) {
                expected[(p * cols + c) * rows + r] =
                    src[(p * rows + r) * cols + c];
            }
        }
    }

    // Check (the dumps are kept to ease debugging of a failing run)
    inputCpu->printData();
    outputGpu2Cpu->printData();
    EXPECT_TRUE(outputGpu2Cpu->equalData(expected));
}

// Exercises TransposeObj on a 1x1x2x3 input filled by IncrementalGenerator.
TEST(xpu_Transpose, run) {
    const Shape inputShape{1, 1, 2, 3};
    testTranspose<TransposeObj>(IncrementalGenerator(), inputShape);
}

} // namespace infini
Xpu (#82) * support kunlun xpu and add an operator named Add * add sub, mul, div, pow, maximum, minimum * add code * add xpu code * add code * add matmul * add transpose * add unary operator * add unary operator * add some operator * add code * support run resnet18 on xpu * add code * add max pool2d * fix xpu code, let it can run. * 添加XPU算子 (#120) * add floordiv for xpu * add batchnorm for xpu * add more cast types for xpu * add conv_trans for xpu * add pad for xpu * add logical ops for xpu * fix format for xpu src and include * fix format for xpu test * fix format for xpu src --------- Co-authored-by: Bolun <bolunz@u.nus.edu> * Xpu abs (#121) * add: unary kernel for xpu * formatting * format * format * format * fix: pointer jump * fix optype comments * fix bug introduced while resolving conflict * change cmake option for kunlunxin xpu from 'xpu' to 'kunlun'; fix bug after merging distributed infrastructure * Add doc support for xpu (#141) * fix * fix * fix pooling test * format * format * fix * fix * set cmake version requirement * fix cmakelists * rename xpu to kunlun * fix * fix format * fix format * fix format * fix change name to kunlun * format * fix format * clang format * fix format --------- Co-authored-by: root <root@localhost.localdomain> Co-authored-by: wanghailu <wanghailu@qiyuanlab.com> Co-authored-by: wanghailu <wanghailu0717@163.com> Co-authored-by: Bolun Zhang <48948016+Chamberlain0w0@users.noreply.github.com> Co-authored-by: Bolun <bolunz@u.nus.edu> Co-authored-by: zhangyue207 <138768300+zhangyue207@users.noreply.github.com> Co-authored-by: Haojie Wang <haojie0429@gmail.com> Co-authored-by: baominghelly <41820386+baominghelly@users.noreply.github.com> Co-authored-by: Bolun <chamberlain0w0@gmail.com> 2023-10-16 10:57:08 +08:00			`#include "core/graph.h"`
			`#include "core/kernel.h"`
			`#include "core/runtime.h"`
			`#include "kunlun/kunlun_runtime.h"`
			`#include "operators/transpose.h"`

			`#include "test.h"`

			`namespace infini {`

			`template <class T>`
			`void testTranspose(`
			`const std::function<void(void *, size_t, DataType)> &generator,`
			`const Shape &shape) {`
			`// Runtime`
			`Runtime cpuRuntime = NativeCpuRuntimeObj::getInstance();`
			`auto xpuRuntime = make_ref<KUNLUNRuntimeObj>();`

			`// Build input data on CPU`
			`Tensor inputCpu = make_ref<TensorObj>(shape, DataType::Float32, cpuRuntime);`
			`inputCpu->dataMalloc();`
			`inputCpu->setData(generator);`

			`// GPU`
			`Graph xpuGraph = make_ref<GraphObj>(xpuRuntime);`
			`auto inputGpu = xpuGraph->cloneTensor(inputCpu);`
			`vector<int> permute = {0, 1, 3, 2};`
			`auto gpuOp = xpuGraph->addOp<T>(inputGpu, nullptr, permute);`
			`xpuGraph->dataMalloc();`
			`xpuRuntime->run(xpuGraph);`
			`auto outputGpu = gpuOp->getOutput();`
			`auto outputGpu2Cpu = outputGpu->clone(cpuRuntime);`
			`// Check`
			`inputCpu->printData();`
			`outputGpu2Cpu->printData();`
			`EXPECT_TRUE(1);`
			`}`

			`TEST(xpu_Transpose, run) {`
			`testTranspose<TransposeObj>(IncrementalGenerator(), Shape{1, 1, 2, 3});`
			`}`

			`} // namespace infini`