InfiniTensor/include/kunlun/kunlun_kernel_without_config.h

#pragma once
#include "core/kernel.h"
#include "kunlun/kunlun_runtime.h"

namespace infini {

class KUNLUNKernelWithoutConfig : public Kernel {
  public:
    virtual void compute(const Operator &op, const PerfRecord &record,
                         const RuntimeObj *context) const {
        compute(op, context);
    }
    virtual void compute(const Operator &op,
                         const RuntimeObj *context) const = 0;
    // Premise: op is idempotent since it is called multiple times.
    virtual PerfRecord tune(const Operator &op,
                            const RuntimeObj *_context) const {
        auto context = dynamic_cast<const KUNLUNRuntimeObj *>(_context);
        return make_ref<PerfRecordObj>(timeit([&]() { compute(op, _context); },
                                              [&]() { context->sync(); }));
    }
};

} // namespace infini
Xpu (#82) * support kunlun xpu and add an operator named Add * add sub, mul, div, pow, maximum, minimum * add code * add xpu code * add code * add matmul * add transpose * add unary operator * add unary operator * add some operator * add code * support run resnet18 on xpu * add code * add max pool2d * fix xpu code, let it can run. * 添加XPU算子 (#120) * add floordiv for xpu * add batchnorm for xpu * add more cast types for xpu * add conv_trans for xpu * add pad for xpu * add logical ops for xpu * fix format for xpu src and include * fix format for xpu test * fix format for xpu src --------- Co-authored-by: Bolun <bolunz@u.nus.edu> * Xpu abs (#121) * add: unary kernel for xpu * formatting * format * format * format * fix: pointer jump * fix optype comments * fix bug introduced while resolving conflict * change cmake option for kunlunxin xpu from 'xpu' to 'kunlun'; fix bug after merging distributed infrastructure * Add doc support for xpu (#141) * fix * fix * fix pooling test * format * format * fix * fix * set cmake version requirement * fix cmakelists * rename xpu to kunlun * fix * fix format * fix format * fix format * fix change name to kunlun * format * fix format * clang format * fix format --------- Co-authored-by: root <root@localhost.localdomain> Co-authored-by: wanghailu <wanghailu@qiyuanlab.com> Co-authored-by: wanghailu <wanghailu0717@163.com> Co-authored-by: Bolun Zhang <48948016+Chamberlain0w0@users.noreply.github.com> Co-authored-by: Bolun <bolunz@u.nus.edu> Co-authored-by: zhangyue207 <138768300+zhangyue207@users.noreply.github.com> Co-authored-by: Haojie Wang <haojie0429@gmail.com> Co-authored-by: baominghelly <41820386+baominghelly@users.noreply.github.com> Co-authored-by: Bolun <chamberlain0w0@gmail.com> 2023-10-16 10:57:08 +08:00			`#pragma once`
			`#include "core/kernel.h"`
			`#include "kunlun/kunlun_runtime.h"`

			`namespace infini {`

			`class KUNLUNKernelWithoutConfig : public Kernel {`
			`public:`
			`virtual void compute(const Operator &op, const PerfRecord &record,`
			`const RuntimeObj *context) const {`
			`compute(op, context);`
			`}`
			`virtual void compute(const Operator &op,`
			`const RuntimeObj *context) const = 0;`
			`// Premise: op is idempotent since it is called multiple times.`
			`virtual PerfRecord tune(const Operator &op,`
			`const RuntimeObj *_context) const {`
			`auto context = dynamic_cast<const KUNLUNRuntimeObj *>(_context);`
			`return make_ref<PerfRecordObj>(timeit([&]() { compute(op, _context); },`
			`[&]() { context->sync(); }));`
			`}`
			`};`

			`} // namespace infini`