forked from jiuyuan/InfiniTensor
Compare commits
merge into: p87291405:master
p87291405:master
p87291405:cuda-attention
p87291405:dev-leakyrelu
p87291405:instance_norm
p87291405:ascend
p87291405:cuda-transpose
p87291405:kvcache_backup
p87291405:kvcache_attention_fp16
p87291405:kunlun_temp
p87291405:dist/graph
p87291405:dist_bench
p87291405:bang-softmax
p87291405:dropout
p87291405:update_pybind11
p87291405:support_fp16
p87291405:add_paddle_model
p87291405:point2point
p87291405:NNET_231111_from_master
p87291405:NNET_231111
p87291405:allocator_memPool
p87291405:test_codegen
p87291405:change_path
p87291405:xpu_allreduce
p87291405:dev-dynamic-graph
p87291405:dev-dynamic-graph-allocator
p87291405:dump/init
p87291405:gpt
p87291405:nnet_e2e_for_merge
p87291405:gencode
p87291405:optimization-pass
p87291405:dev-memory
p87291405:conv_half
p87291405:benchmark_conv
p87291405:benchmark_softmax
p87291405:benchmark
p87291405:dcj/for_multiple_datatype
p87291405:Conv_NHWC
p87291405:NNET_bias
p87291405:NNET_bias_0630
p87291405:constroy/doc_on_ares
p87291405:pure_engine
p87291405:v0630
p87291405:NNET_e2e
p87291405:update_doc
p87291405:model_test
p87291405:TC_revision
p87291405:NNET_gcn
p87291405:NNET_op_test
p87291405:NNET_OpSearch
p87291405:NNET_gcn_fuse
p87291405:fsrcnn-conv-bias-act-fuse
p87291405:NNET_e2e_for_merge
p87291405:NNET_eliminateOP
p87291405:NNET_anyOp
p87291405:NNET_transpose
p87291405:cpu_backend2
p87291405:NNET_e2e_fix
p87291405:NNET_GAN
p87291405:test_onnx
p87291405:activation
p87291405:ddp
p87291405:search_engine
p87291405:power-fusion
p87291405:op_timer
p87291405:graph-onnx
p87291405:graphFactory
p87291405:case-fsrcnn
p87291405:testAccuracy
p87291405:train_wanghailu_1010
p87291405:broadcast_wanghailu_0916
jiuyuan:test-models
pull from: p87291405:master
p87291405:cuda-attention
p87291405:dev-leakyrelu
p87291405:instance_norm
p87291405:ascend
p87291405:cuda-transpose
p87291405:master
p87291405:kvcache_backup
p87291405:kvcache_attention_fp16
p87291405:kunlun_temp
p87291405:dist/graph
p87291405:dist_bench
p87291405:bang-softmax
p87291405:dropout
p87291405:update_pybind11
p87291405:support_fp16
p87291405:add_paddle_model
p87291405:point2point
p87291405:NNET_231111_from_master
p87291405:NNET_231111
p87291405:allocator_memPool
p87291405:test_codegen
p87291405:change_path
p87291405:xpu_allreduce
p87291405:dev-dynamic-graph
p87291405:dev-dynamic-graph-allocator
p87291405:dump/init
p87291405:gpt
p87291405:nnet_e2e_for_merge
p87291405:gencode
p87291405:optimization-pass
p87291405:dev-memory
p87291405:conv_half
p87291405:benchmark_conv
p87291405:benchmark_softmax
p87291405:benchmark
p87291405:dcj/for_multiple_datatype
p87291405:Conv_NHWC
p87291405:NNET_bias
p87291405:NNET_bias_0630
p87291405:constroy/doc_on_ares
p87291405:pure_engine
p87291405:v0630
p87291405:NNET_e2e
p87291405:update_doc
p87291405:model_test
p87291405:TC_revision
p87291405:NNET_gcn
p87291405:NNET_op_test
p87291405:NNET_OpSearch
p87291405:NNET_gcn_fuse
p87291405:fsrcnn-conv-bias-act-fuse
p87291405:NNET_e2e_for_merge
p87291405:NNET_eliminateOP
p87291405:NNET_anyOp
p87291405:NNET_transpose
p87291405:cpu_backend2
p87291405:NNET_e2e_fix
p87291405:NNET_GAN
p87291405:test_onnx
p87291405:activation
p87291405:ddp
p87291405:search_engine
p87291405:power-fusion
p87291405:op_timer
p87291405:graph-onnx
p87291405:graphFactory
p87291405:case-fsrcnn
p87291405:testAccuracy
p87291405:train_wanghailu_1010
p87291405:broadcast_wanghailu_0916
jiuyuan:code_generate
jiuyuan:support_ascend_fp16_zyz
jiuyuan:aug-cuda-op-need
jiuyuan:master
jiuyuan:fix_runtime
jiuyuan:support_ascend_fp16
jiuyuan:cxjj
jiuyuan:fix_fp16_matmul
jiuyuan:bang-rmsnorm
jiuyuan:cuda-attention
jiuyuan:operator-test
jiuyuan:bang-rms-soft
jiuyuan:cuda-transpose
jiuyuan:add_leaky_relu
jiuyuan:instance_norm
jiuyuan:kvcache_backup
jiuyuan:kvcache_attention_fp16
jiuyuan:kunlun_temp
jiuyuan:dist/graph
jiuyuan:dist_bench
jiuyuan:dropout
jiuyuan:update_pybind11
jiuyuan:support_fp16
jiuyuan:add_paddle_model
jiuyuan:point2point
jiuyuan:NNET_231111_from_master
jiuyuan:NNET_231111
jiuyuan:allocator_memPool
jiuyuan:test_codegen
jiuyuan:change_path
jiuyuan:xpu_allreduce
jiuyuan:dev-dynamic-graph
jiuyuan:dev-dynamic-graph-allocator
jiuyuan:dump/init
jiuyuan:gpt
jiuyuan:nnet_e2e_for_merge
jiuyuan:gencode
jiuyuan:optimization-pass
jiuyuan:dev-memory
jiuyuan:conv_half
jiuyuan:benchmark_conv
jiuyuan:benchmark_softmax
jiuyuan:benchmark
jiuyuan:dcj/for_multiple_datatype
jiuyuan:Conv_NHWC
jiuyuan:NNET_bias
jiuyuan:NNET_bias_0630
jiuyuan:constroy/doc_on_ares
jiuyuan:pure_engine
jiuyuan:v0630
jiuyuan:NNET_e2e
jiuyuan:update_doc
jiuyuan:model_test
jiuyuan:TC_revision
jiuyuan:NNET_gcn
jiuyuan:NNET_op_test
jiuyuan:NNET_OpSearch
jiuyuan:NNET_gcn_fuse
jiuyuan:fsrcnn-conv-bias-act-fuse
jiuyuan:NNET_e2e_for_merge
jiuyuan:NNET_eliminateOP
jiuyuan:NNET_anyOp
jiuyuan:NNET_transpose
jiuyuan:cpu_backend2
jiuyuan:NNET_e2e_fix
jiuyuan:NNET_GAN
jiuyuan:test_onnx
jiuyuan:activation
jiuyuan:ddp
jiuyuan:search_engine
jiuyuan:power-fusion
jiuyuan:op_timer
jiuyuan:graph-onnx
jiuyuan:graphFactory
jiuyuan:case-fsrcnn
jiuyuan:testAccuracy
jiuyuan:train_wanghailu_1010
jiuyuan:broadcast_wanghailu_0916
jiuyuan:test-models
These branches are equal. There is no need to create a pull request.