Files
FastDeploy/third_party/optimizer/onnxoptimizer/passes/fuse_transpose_into_gemm.h
Jason 6343b0db47 [Build] Support build with source code of Paddle2ONNX (#1559)
* Add notes for tensors

* Optimize some apis

* move some warnings

* Support build with Paddle2ONNX

* Add protobuf support

* Fix compile on mac

* add clearn package script

* Add paddle2onnx code

* remove submodule

* Add onnx ocde

* remove softlink

* add onnx code

* fix error

* Add cmake file

* fix patchelf

* update paddle2onnx

* Delete .gitmodules

---------

Co-authored-by: PaddleCI <paddle_ci@example.com>
Co-authored-by: pangyoki <pangyoki@126.com>
Co-authored-by: jiangjiajun <jiangjiajun@baidu.lcom>
2023-03-17 10:03:22 +08:00

49 lines
1.4 KiB
C++

/*
* SPDX-License-Identifier: Apache-2.0
*/
// ATTENTION: The code in this file is highly EXPERIMENTAL.
// Adventurous users should note that the APIs will probably change.
#pragma once
#include "onnxoptimizer/pass.h"
namespace ONNX_NAMESPACE {
namespace optimization {
struct FuseTransposeIntoGemm final : public PredicateBasedPass {
explicit FuseTransposeIntoGemm()
: PredicateBasedPass(PassType::Fuse, PassEfficiency::Complete,
PassOptimizationType::Compute) {}
std::string getPassName() const override {
return "fuse_transpose_into_gemm";
}
bool patternMatchPredicate(Node* node) override {
return node->kind() == kGemm;
}
bool runTransform(Node* n, Graph&,
NodeDestroyType& destroy_current) override {
const std::vector<int64_t> simple_trans_perm({1, 0});
destroy_current = NodeDestroyType::DestroyZero;
bool ret_val = false;
for (size_t i : {0, 1}) {
auto inp = n->inputs()[i];
auto trans = i == 0 ? ktransA : ktransB;
if (inp->node()->kind() == kTranspose &&
inp->node()->is(kperm) == simple_trans_perm) {
n->replaceInput(i, inp->node()->input());
n->i_(trans, n->hasAttribute(trans) ? !n->i(trans) : 1);
if (inp->uses().size() == 0) {
inp->node()->destroy();
ret_val = true;
}
}
}
return ret_val;
}
};
} // namespace optimization
} // namespace ONNX_NAMESPACE