TIM-VX/src/tim/vx/graph.cc

208 lines
6.8 KiB
C++

/****************************************************************************
*
* Copyright (c) 2020 Vivante Corporation
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*
*****************************************************************************/
#include "tim/vx/graph.h"
#include <algorithm>
#include "context_private.h"
#include "graph_private.h"
#include "op_impl.h"
#include "tensor_private.h"
#include "tim/vx/context.h"
#include "tim/vx/ops/nbg.h"
#include "tim/vx/compile_option.h"
#include "vsi_nn_pub.h"
namespace tim {
namespace vx {
const std::vector<std::shared_ptr<Tensor>> Graph::GetConstantInputs() const {
std::vector<std::shared_ptr<Tensor>> const_inputs;
for (auto op : op_vector_) {
auto const_i = op->ConstantInputsTensor();
const_inputs.insert(const_inputs.end(), const_i.begin(), const_i.end());
}
return const_inputs;
}
GraphImpl::GraphImpl(ContextImpl* context, const CompileOption& options)
: context_(context),
graph_(vsi_nn_CreateGraph(context_->context(), 0, 0)),
tensor_placeholder_(nullptr),
options_(options){}
GraphImpl::~GraphImpl() { vsi_nn_ReleaseGraph(&graph_); }
vsi_nn_graph_t* GraphImpl::graph() { return graph_; }
void GraphImpl::AddInput(vsi_nn_tensor_id_t id) {
if (inputs_.end() == std::find(inputs_.begin(), inputs_.end(), id)) {
inputs_.push_back(id);
}
}
void GraphImpl::AddOutput(vsi_nn_tensor_id_t id) {
if (outputs_.end() == std::find(outputs_.begin(), outputs_.end(), id)) {
outputs_.push_back(id);
}
}
void GraphImpl::AddInput(const std::shared_ptr<Tensor>& tensor) {
if (inputs_tensor_.end() ==
std::find(inputs_tensor_.begin(), inputs_tensor_.end(), tensor)) {
inputs_tensor_.push_back(tensor);
}
}
void GraphImpl::AddOutput(const std::shared_ptr<Tensor>& tensor) {
if (outputs_tensor_.end() ==
std::find(outputs_tensor_.begin(), outputs_tensor_.end(), tensor)) {
outputs_tensor_.push_back(tensor);
}
}
const std::vector<std::shared_ptr<Tensor>> GraphImpl::InputsTensor() const {
return inputs_tensor_;
}
const std::vector<std::shared_ptr<Tensor>> GraphImpl::OutputsTensor() const {
return outputs_tensor_;
}
void GraphImpl::UpdateTensorConsumersMap(const std::shared_ptr<Tensor>& tensor,
const Operation* op) {
for (const auto& added_op : op_vector_) {
if (added_op.get() == op) {
tensor_consumers_[tensor].push_back(added_op);
}
}
}
void GraphImpl::UpdateTensorProducerMap(const std::shared_ptr<Tensor>& tensor,
const Operation* op) {
for (const auto& added_op : op_vector_) {
if (added_op.get() == op) {
tensor_producer_[tensor] = added_op;
}
}
}
const std::vector<std::shared_ptr<Operation>> GraphImpl::GetConsumersOp(
std::shared_ptr<Tensor> tensor) const {
auto consumers = tensor_consumers_.find(tensor);
if (tensor_consumers_.end() != consumers) {
return consumers->second;
} else {
VSILOGD("Tensor has no consumers, may be graph output.");
return {};
}
}
std::shared_ptr<Operation> GraphImpl::GetProducerOp(
std::shared_ptr<Tensor> tensor) {
auto producer = tensor_producer_.find(tensor);
if (tensor_producer_.end() != producer) {
return producer->second;
} else {
VSILOGD("Tensor has no producer, may be graph input.");
return {};
}
}
void GraphImpl::PrintGraph() const { vsi_nn_PrintGraph(this->graph_); }
std::shared_ptr<Tensor> GraphImpl::CreateTensor(const TensorSpec& spec,
const void* data) {
return std::make_shared<TensorImpl>(this, spec, data);
}
std::shared_ptr<Tensor> GraphImpl::CreateTensor(const TensorSpec& spec,
const DmaBufferDesc& dmafd) {
return std::make_shared<TensorImpl>(this, spec, dmafd);
}
std::shared_ptr<Tensor> GraphImpl::CreateTensorPlaceHolder() {
if (!tensor_placeholder_) {
tensor_placeholder_ = std::make_shared<TensorPlaceholder>(this);
}
return tensor_placeholder_;
}
bool GraphImpl::Compile() {
bool status = true;
auto major = vsi_nn_GetVersionMajor();
auto minor = vsi_nn_GetVersionMinor();
auto patch = vsi_nn_GetVersionPatch();
vsi_nn_SetGraphVersion(graph_, major, minor, patch);
bool is_fast_mode = options_.isRelaxMode();
if (is_fast_mode) {
VSILOGW("Important notice: float model executed in bfloat16 "
"mode which will have better performance but lower precesion");
}
vsi_nn_SetGraphFastMode(graph_, is_fast_mode);
std::call_once(setio_once_, [&status, this]() {
status = (vsi_nn_SetGraphInputs(this->graph_, this->inputs_.data(),
this->inputs_.size()) &&
vsi_nn_SetGraphOutputs(this->graph_, this->outputs_.data(),
this->outputs_.size()));
});
std::call_once(setup_once_, [&status, this]() {
status = (VSI_SUCCESS == vsi_nn_SetupGraph(this->graph_, true));
});
std::call_once(verify_graph_once_, [&status, this]() {
status = (VSI_SUCCESS == vsi_nn_VerifyGraph(this->graph_));
});
return status;
}
bool GraphImpl::CompileToBinary(void* buf, size_t* size) {
bool status = true;
std::call_once(setio_once_, [&status, this]() {
status = (vsi_nn_SetGraphInputs(this->graph_, this->inputs_.data(),
this->inputs_.size()) &&
vsi_nn_SetGraphOutputs(this->graph_, this->outputs_.data(),
this->outputs_.size()));
});
std::call_once(setup_once_, [&status, this]() {
status = (VSI_SUCCESS == vsi_nn_SetupGraph(this->graph_, true));
});
return ((status) && (VSI_SUCCESS == vsi_nn_GenerateNBG(graph_, buf, size)));
}
bool GraphImpl::Run() {
return ((Compile()) && (VSI_SUCCESS == vsi_nn_RunGraph(graph_)));
}
} // namespace vx
} // namespace tim