ncnn / tools /pnnx /src /pass_level3 /fuse_multiheadattention_unpack.cpp

thanks to ncnn ❤

be903e2 over 2 years ago

1.94 kB

	// Tencent is pleased to support the open source community by making ncnn available.
	//
	// Copyright (C) 2022 THL A29 Limited, a Tencent company. All rights reserved.
	//
	// Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
	// in compliance with the License. You may obtain a copy of the License at
	//
	// https://opensource.org/licenses/BSD-3-Clause
	//
	// Unless required by applicable law or agreed to in writing, software distributed
	// under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
	// CONDITIONS OF ANY KIND, either express or implied. See the License for the
	// specific language governing permissions and limitations under the License.

	#include "fuse_multiheadattention_unpack.h"
	#include <algorithm>
	#include "pass_level2.h"

	namespace pnnx {

	void fuse_multiheadattention_unpack(Graph& graph)
	{
	while (1)
	{
	bool matched = false;

	for (size_t i = 0; i < graph.ops.size(); i++)
	{
	Operator* op = graph.ops[i];

	if (op->type != "nn.MultiheadAttention")
	continue;

	if (op->outputs.size() != 1)
	continue;

	if (op->outputs[0]->consumers.size() != 1)
	continue;

	Operator* op2 = op->outputs[0]->consumers[0];
	if (op2->type != "prim::TupleUnpack")
	continue;

	matched = true;

	op->outputs[0]->producer = 0;
	op->outputs[0]->remove_consumer(op2);

	for (auto& x : op2->outputs)
	{
	x->producer = op;
	}

	op->outputs = op2->outputs;

	op2->inputs.clear();
	op2->outputs.clear();

	graph.ops.erase(std::find(graph.ops.begin(), graph.ops.end(), op2));

	delete op2;

	break;
	}

	if (!matched)
	break;
	}
	}

	} // namespace pnnx