forked from mindspore-Ecosystem/mindspore
!13764 [MS][LITE] remove param value lite
From: @jianghui58 Reviewed-by: Signed-off-by:
This commit is contained in:
commit
d17b2c98e3
|
@ -1,79 +0,0 @@
|
|||
/**
|
||||
* Copyright 2020 Huawei Technologies Co., Ltd
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef MINDSPORE_LITE_SRC_PARAM_VALUE_LITE_H_
|
||||
#define MINDSPORE_LITE_SRC_PARAM_VALUE_LITE_H_
|
||||
|
||||
#include <memory>
|
||||
#include <algorithm>
|
||||
#include <vector>
|
||||
#include <utility>
|
||||
#include "src/tensor.h"
|
||||
|
||||
namespace mindspore {
|
||||
class ParamValueLite : public Value {
|
||||
public:
|
||||
ParamValueLite() : tensor_addr_(nullptr), tensor_size_(0) {}
|
||||
~ParamValueLite() override {
|
||||
if (tensor_addr_ != nullptr) {
|
||||
auto tensor_mem = reinterpret_cast<char *>(tensor_addr_);
|
||||
delete[](tensor_mem);
|
||||
tensor_addr_ = nullptr;
|
||||
tensor_size_ = 0;
|
||||
}
|
||||
}
|
||||
MS_DECLARE_PARENT(ParamValueLite, Value)
|
||||
size_t tensor_size() const { return tensor_size_; }
|
||||
void set_tensor_size(const size_t size) { tensor_size_ = size; }
|
||||
void *tensor_addr() const { return tensor_addr_; }
|
||||
void set_tensor_addr(void *addr) { tensor_addr_ = addr; }
|
||||
|
||||
std::vector<int> tensor_shape() const { return tensor_shape_; }
|
||||
void set_tensor_shape(const std::vector<int> &tensor_shape) { tensor_shape_ = tensor_shape; }
|
||||
|
||||
TypeId tensor_type() const { return type_id_; }
|
||||
void set_tensor_type(const TypeId type_id) { type_id_ = type_id; }
|
||||
|
||||
void SetTensorData(void *addr, const size_t size) {
|
||||
this->tensor_addr_ = addr;
|
||||
this->tensor_size_ = size;
|
||||
}
|
||||
|
||||
int tensor_shape_size() const {
|
||||
int size = 1;
|
||||
for (auto val : tensor_shape_) {
|
||||
size *= val;
|
||||
}
|
||||
return size;
|
||||
}
|
||||
|
||||
bool operator==(const Value &other) const override { return this == &other; }
|
||||
|
||||
int format() const { return this->format_; }
|
||||
|
||||
void set_format(int format) { this->format_ = format; }
|
||||
|
||||
private:
|
||||
void *tensor_addr_ = nullptr;
|
||||
size_t tensor_size_ = 0;
|
||||
int format_ = schema::Format::Format_KCHW;
|
||||
std::vector<int> tensor_shape_{};
|
||||
TypeId type_id_ = TypeId::kNumberTypeFloat32;
|
||||
};
|
||||
|
||||
using ParamValueLitePtr = std::shared_ptr<ParamValueLite>;
|
||||
} // namespace mindspore
|
||||
#endif // MINDSPORE_LITE_SRC_PARAM_VALUE_LITE_H_
|
|
@ -152,11 +152,7 @@ set(TEST_LITE_SRC
|
|||
${LITE_DIR}/src/common/file_utils.cc
|
||||
${LITE_DIR}/src/common/utils.cc
|
||||
${LITE_DIR}/src/common/string_util.cc
|
||||
${LITE_DIR}/tools/common/graph_util.cc
|
||||
${LITE_DIR}/tools/common/tensor_util.cc
|
||||
${LITE_DIR}/tools/common/node_util.cc
|
||||
${LITE_DIR}/tools/common/flag_parser.cc
|
||||
${LITE_DIR}/tools/common/storage.cc
|
||||
${LITE_DIR}/tools/benchmark/benchmark.cc
|
||||
${LITE_DIR}/test/st/benchmark_test.cc
|
||||
${LITE_DIR}/src/errorcode.cc
|
||||
|
@ -271,6 +267,10 @@ if(ENABLE_CONVERTER)
|
|||
${LITE_DIR}/tools/optimizer/graph/functionalize_cond.cc
|
||||
${LITE_DIR}/tools/optimizer/graph/inputs_adjust_pass.cc
|
||||
${LITE_DIR}/tools/optimizer/graph/primitive_adjust_pass.cc
|
||||
${LITE_DIR}/tools/common/graph_util.cc
|
||||
${LITE_DIR}/tools/common/tensor_util.cc
|
||||
${LITE_DIR}/tools/common/node_util.cc
|
||||
${LITE_DIR}/tools/common/storage.cc
|
||||
)
|
||||
endif()
|
||||
### train
|
||||
|
|
|
@ -18,12 +18,12 @@
|
|||
#include <algorithm>
|
||||
#include "schema/inner/model_generated.h"
|
||||
#include "frontend/operator/ops.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "src/common/log_adapter.h"
|
||||
#include "tools/converter/converter_context.h"
|
||||
#include "include/errorcode.h"
|
||||
#include "test/common/import_from_meta_graphT.h"
|
||||
#include "ir/func_graph.h"
|
||||
#include "src/common/utils.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
|
||||
namespace mindspore::lite {
|
||||
AnfNodePtr AnfImporterFromMetaGraphT::GetNode(int tensor_id) {
|
||||
|
@ -50,41 +50,34 @@ int AnfImporterFromMetaGraphT::ConverterConstTensor() {
|
|||
std::copy(tensor->dims.begin(), tensor->dims.end(), shape.begin());
|
||||
auto type_id = static_cast<TypeId>(tensor->dataType);
|
||||
auto type_ptr = TypeIdToType(type_id);
|
||||
std::vector<int64_t> shape_vector;
|
||||
(void)std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape_vector);
|
||||
MS_ASSERT(nullptr != abstract_tensor);
|
||||
parameter->set_abstract(abstract_tensor);
|
||||
std::vector<int64_t> shape_vector(shape.begin(), shape.end());
|
||||
if (!tensor->name.empty()) {
|
||||
parameter->set_name(tensor->name);
|
||||
} else {
|
||||
parameter->set_name("const-" + std::to_string(i));
|
||||
}
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(nullptr != param_value);
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_tensor_type(type_id);
|
||||
param_value->set_format(tensor->format);
|
||||
tensor::TensorPtr tensor_info = std::make_shared<tensor::Tensor>(type_id, shape_vector);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
int status = RET_OK;
|
||||
if (!tensor->data.empty()) {
|
||||
auto size = tensor->data.size();
|
||||
char *tensor_data = new (std::nothrow) char[size];
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new char[] failed";
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
auto tensor_data = static_cast<char *>(tensor_info->data_c());
|
||||
auto ret = memcpy_s(tensor_data, size, tensor->data.data(), size);
|
||||
if (EOK != ret) {
|
||||
MS_LOG(ERROR) << "memcpy_s error";
|
||||
delete[] tensor_data;
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
param_value->SetTensorData(tensor_data, size);
|
||||
parameter->set_default_param(param_value);
|
||||
status = lite::InitParameterFromTensorInfo(parameter, tensor_info);
|
||||
} else if (std::find(meta_graph_->inputIndex.begin(), meta_graph_->inputIndex.end(), i) ==
|
||||
meta_graph_->inputIndex.end()) {
|
||||
parameter->set_default_param(param_value);
|
||||
status = lite::InitParameterFromTensorInfo(parameter, tensor_info);
|
||||
}
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
AddNode(i, parameter);
|
||||
}
|
||||
|
|
|
@ -67,7 +67,7 @@ ml_video_edit_v10_best_model_nomean_20200723 8
|
|||
#hdc_ocr_detect.onnx 30 #too many subgraphs
|
||||
ml_edu_kit_hand_detection.onnx 1
|
||||
ml_edu_kit_hand_key_position.onnx 2
|
||||
ml_video_edit_oneclick_adaptis.pb 2 3
|
||||
#ml_video_edit_oneclick_adaptis.pb 2 3
|
||||
densenet.tflite 3
|
||||
resnet_v2_101_299.tflite 1
|
||||
ml_video_edit_enhance.pb 2
|
||||
|
|
|
@ -1,9 +1,9 @@
|
|||
ml_video_edit_video_segment_gauss_adaptis_part2_pb2tflite.tflite;2 11
|
||||
ml_video_edit_video_segment_gauss_adaptis_part2.pb;2 11
|
||||
ml_video_edit_video_segment_gauss_adaptis_part2.pb;2 12.3
|
||||
ml_video_edit_img_segment_adaptise.pb;2 40
|
||||
ml_video_edit_img_segment_adaptise_pb2tflite.tflite;2 0.5
|
||||
ml_video_edit_person_divison_video;2 38
|
||||
ml_video_edit_oneclick_adaptis.pb;3 6
|
||||
ml_video_edit_oneclick_adaptis.pb;3 6.1
|
||||
hdc_tb_cn_neg.tflite;3 281
|
||||
decoder_step_201217.pb;5 187
|
||||
ml_video_edit_art_transfer.onnx;3 3
|
||||
|
|
|
@ -21,6 +21,8 @@
|
|||
#include <utility>
|
||||
#include <vector>
|
||||
#include <algorithm>
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "abstract/abstract_value.h"
|
||||
#include "mindspore/core/ir/primitive.h"
|
||||
#include "ops/fusion/partial_fusion.h"
|
||||
|
@ -32,8 +34,8 @@
|
|||
#include "tools/converter/quant_param_holder.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "src/tensor.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "src/common/utils.h"
|
||||
#include "ops/op_utils.h"
|
||||
#include "tools/common/graph_util.h"
|
||||
#include "src/ops/ops_utils.h"
|
||||
|
||||
|
@ -77,6 +79,51 @@ std::list<CNodePtr> GetOrderedCNodes(const FuncGraphPtr fg) {
|
|||
}
|
||||
return cnodes;
|
||||
}
|
||||
ShapeVector GetShapeVectorFromTensorInfo(const tensor::TensorPtr &tensor_info, size_t *offset) {
|
||||
ShapeVector shape_vector;
|
||||
auto tensor_data = reinterpret_cast<uint8_t *>(tensor_info->data_c());
|
||||
std::string shape_str;
|
||||
std::string shape_size_str;
|
||||
*offset = 0;
|
||||
size_t cnt = 0;
|
||||
for (; *offset < tensor_info->Size(); (*offset)++) {
|
||||
if (tensor_data[*offset] == ',') {
|
||||
(*offset)++;
|
||||
break;
|
||||
}
|
||||
shape_size_str.push_back(tensor_data[*offset]);
|
||||
}
|
||||
size_t shape_size = std::stoi(shape_size_str);
|
||||
for (; *offset < tensor_info->Size(); (*offset)++) {
|
||||
if (tensor_data[*offset] == ',') {
|
||||
cnt++;
|
||||
shape_vector.push_back(std::stoi(shape_str));
|
||||
shape_str.clear();
|
||||
} else {
|
||||
shape_str.push_back(tensor_data[*offset]);
|
||||
}
|
||||
if (cnt == shape_size) {
|
||||
(*offset)++;
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
return shape_vector;
|
||||
}
|
||||
schema::Format GetFormatByFmk(int32_t fmk_type) {
|
||||
switch (fmk_type) {
|
||||
case converter::FmkType_ONNX:
|
||||
case lite::converter::FmkType_CAFFE:
|
||||
case lite::converter::FmkType_MS:
|
||||
return schema::Format_NCHW;
|
||||
case lite::converter::FmkType_TF:
|
||||
case lite::converter::FmkType_TFLITE:
|
||||
return schema::Format_NHWC;
|
||||
default:
|
||||
MS_LOG(ERROR) << "don't support current fmk: " + fmk_type;
|
||||
return static_cast<schema::Format>(fmk_type);
|
||||
}
|
||||
}
|
||||
} // namespace
|
||||
|
||||
void AnfExporter::RemoveIfMakeTuple(const CNodePtr &cnode) {
|
||||
|
@ -164,9 +211,9 @@ int AnfExporter::ConvertQuantParam(const std::unique_ptr<schema::MetaGraphT> &me
|
|||
QuantParamsVector input_quant_params;
|
||||
QuantParamsVector output_quant_params;
|
||||
dst_node->quantType = schema::QuantType_QUANT_NONE;
|
||||
auto quant_param_valueptr = primitive->GetAttr("quant_params");
|
||||
if (quant_param_valueptr != nullptr) {
|
||||
auto quant_param_holder = quant_param_valueptr->cast<QuantParamHolderPtr>();
|
||||
auto quant_tensor_info_ptr = primitive->GetAttr("quant_params");
|
||||
if (quant_tensor_info_ptr != nullptr) {
|
||||
auto quant_param_holder = quant_tensor_info_ptr->cast<QuantParamHolderPtr>();
|
||||
if (quant_param_holder == nullptr) {
|
||||
MS_LOG(ERROR) << "quant param is invalid.";
|
||||
return RET_ERROR;
|
||||
|
@ -553,160 +600,174 @@ int AnfExporter::ConvertInputParameter(const std::shared_ptr<AnfNode> &input_ano
|
|||
const std::shared_ptr<PrimitiveC> &primitive_c,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT,
|
||||
schema::CNodeT *output_cnode) {
|
||||
auto paramNode = input_anode->cast<ParameterPtr>();
|
||||
std::string input_name = paramNode->fullname_with_scope();
|
||||
auto param_node = input_anode->cast<ParameterPtr>();
|
||||
std::string input_name = param_node->fullname_with_scope();
|
||||
if (node_id_map_.find(input_name) != node_id_map_.end()) {
|
||||
output_cnode->inputIndex.emplace_back(node_id_map_[paramNode->name()]);
|
||||
output_cnode->inputIndex.emplace_back(node_id_map_[param_node->name()]);
|
||||
return RET_OK;
|
||||
}
|
||||
auto paramTensor = std::make_unique<schema::TensorT>();
|
||||
paramTensor->format = schema::Format_NHWC;
|
||||
paramTensor->name = paramNode->name();
|
||||
auto abstractBase = paramNode->abstract();
|
||||
if (abstractBase == nullptr) {
|
||||
MS_LOG(ERROR) << "Abstract of parameter is nullptr, " << paramNode->name();
|
||||
auto schema_tensor = std::make_unique<schema::TensorT>();
|
||||
schema_tensor->format = GetFormatByFmk(meta_graphT->fmkType);
|
||||
if (schema_tensor->format != schema::Format_NHWC && schema_tensor->format != schema::Format_NCHW) {
|
||||
MS_LOG(ERROR) << "schema tensor format is wrong, " << schema_tensor->format;
|
||||
return RET_ERROR;
|
||||
}
|
||||
schema_tensor->name = param_node->name();
|
||||
auto abstract_base = param_node->abstract();
|
||||
if (abstract_base == nullptr) {
|
||||
MS_LOG(ERROR) << "Abstract of parameter is nullptr, " << param_node->name();
|
||||
return RET_PARAM_INVALID;
|
||||
}
|
||||
if (!utils::isa<abstract::AbstractTensorPtr>(abstractBase)) {
|
||||
MS_LOG(ERROR) << "Abstract of parameter should be anstract tensor, " << paramNode->name();
|
||||
if (!utils::isa<abstract::AbstractTensorPtr>(abstract_base)) {
|
||||
MS_LOG(ERROR) << "Abstract of parameter should be anstract tensor, " << param_node->name();
|
||||
return RET_INPUT_TENSOR_ERROR;
|
||||
}
|
||||
auto abstractTensor = utils::cast<abstract::AbstractTensorPtr>(abstractBase);
|
||||
auto typePtr = abstractTensor->element()->GetTypeTrack();
|
||||
auto abstract_tensor = utils::cast<abstract::AbstractTensorPtr>(abstract_base);
|
||||
auto typePtr = abstract_tensor->element()->GetTypeTrack();
|
||||
MS_ASSERT(typePtr != nullptr);
|
||||
paramTensor->dataType = typePtr->type_id();
|
||||
if (!utils::isa<abstract::ShapePtr>(abstractTensor->BuildShape())) {
|
||||
MS_LOG(ERROR) << "Shape of Abstract of parameter should be ShapePtr, " << paramNode->name();
|
||||
schema_tensor->dataType = typePtr->type_id();
|
||||
if (!utils::isa<abstract::ShapePtr>(abstract_tensor->BuildShape())) {
|
||||
MS_LOG(ERROR) << "Shape of Abstract of parameter should be ShapePtr, " << param_node->name();
|
||||
return RET_PARAM_INVALID;
|
||||
}
|
||||
auto shape_vector = utils::cast<abstract::ShapePtr>(abstractTensor->BuildShape())->shape();
|
||||
auto tensor_info = std::dynamic_pointer_cast<tensor::Tensor>(param_node->default_param());
|
||||
auto shape_vector = utils::cast<abstract::ShapePtr>(abstract_tensor->BuildShape())->shape();
|
||||
size_t offset = 0;
|
||||
if (!shape_vector.empty() && schema_tensor->dataType == kObjectTypeString) {
|
||||
shape_vector = GetShapeVectorFromTensorInfo(tensor_info, &offset);
|
||||
}
|
||||
std::vector<int32_t> dims;
|
||||
(void)std::transform(shape_vector.begin(), shape_vector.end(), std::back_inserter(dims),
|
||||
[](const int64_t &value) { return static_cast<int32_t>(value); });
|
||||
paramTensor->dims = dims;
|
||||
auto paramValue = std::dynamic_pointer_cast<ParamValueLite>(paramNode->default_param());
|
||||
if (paramValue != nullptr && paramValue->tensor_size() != 0) {
|
||||
paramTensor->data.resize(paramValue->tensor_size());
|
||||
paramTensor->format = schema::Format(paramValue->format());
|
||||
if (EOK != memcpy_s(paramTensor->data.data(), paramTensor->data.size(), paramValue->tensor_addr(),
|
||||
paramValue->tensor_size())) {
|
||||
MS_LOG(ERROR) << "memcpy_s failed.";
|
||||
return RET_ERROR;
|
||||
schema_tensor->dims = dims;
|
||||
if (tensor_info != nullptr && tensor_info->Size() != 0) {
|
||||
if (schema_tensor->dataType == kObjectTypeTensorType && shape_vector.empty() &&
|
||||
meta_graphT->fmkType == converter::FmkType_ONNX) {
|
||||
schema_tensor->data.resize(0);
|
||||
} else {
|
||||
schema_tensor->data.resize(tensor_info->Size() - offset);
|
||||
if (EOK != memcpy_s(schema_tensor->data.data(), schema_tensor->data.size(),
|
||||
static_cast<uint8_t *>(tensor_info->data_c()) + offset, tensor_info->Size() - offset)) {
|
||||
MS_LOG(ERROR) << "memcpy_s failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
paramTensor->name = input_name;
|
||||
if (primitive_c->GetAttr(opt::kWeightFormat) != nullptr) {
|
||||
schema_tensor->format = static_cast<schema::Format>(GetValue<int64_t>(primitive_c->GetAttr(opt::kWeightFormat)));
|
||||
}
|
||||
schema_tensor->name = input_name;
|
||||
QuantParamHolderPtr quant_param_holder = primitive_c->GetAttr("quant_params") == nullptr
|
||||
? nullptr
|
||||
: primitive_c->GetAttr("quant_params")->cast<QuantParamHolderPtr>();
|
||||
if (quant_param_holder != nullptr && quant_param_holder->enable_huffman_code() &&
|
||||
paramTensor->dataType == kNumberTypeInt8) {
|
||||
paramTensor->enableHuffmanCode = true;
|
||||
schema_tensor->dataType == kNumberTypeInt8) {
|
||||
schema_tensor->enableHuffmanCode = true;
|
||||
}
|
||||
node_id_map_[input_name] = meta_graphT->allTensors.size();
|
||||
output_cnode->inputIndex.emplace_back(meta_graphT->allTensors.size());
|
||||
meta_graphT->allTensors.emplace_back(std::move(paramTensor));
|
||||
meta_graphT->allTensors.emplace_back(std::move(schema_tensor));
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
int AnfExporter::ProcessTensor(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
int AnfExporter::ProcessTensor(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT) {
|
||||
int ret;
|
||||
auto valueAbstract = valueNode->abstract();
|
||||
auto abstractTensor = utils::cast<abstract::AbstractTensorPtr>(valueAbstract);
|
||||
if (abstractTensor == nullptr || abstractTensor->element() == nullptr) {
|
||||
MS_LOG(ERROR) << "abstractTensor or abstractTensor->element() is nullptr";
|
||||
auto valueAbstract = value_node->abstract();
|
||||
auto abstract_tensor = utils::cast<abstract::AbstractTensorPtr>(valueAbstract);
|
||||
if (abstract_tensor == nullptr || abstract_tensor->element() == nullptr) {
|
||||
MS_LOG(ERROR) << "abstract_tensor or abstract_tensor->element() is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto typePtr = abstractTensor->element()->GetTypeTrack();
|
||||
(*paramTensor)->dataType = typePtr->type_id();
|
||||
auto shape_vector = utils::cast<abstract::ShapePtr>(abstractTensor->BuildShape())->shape();
|
||||
auto typePtr = abstract_tensor->element()->GetTypeTrack();
|
||||
(*schema_tensor)->dataType = typePtr->type_id();
|
||||
auto shape_vector = utils::cast<abstract::ShapePtr>(abstract_tensor->BuildShape())->shape();
|
||||
std::vector<int32_t> dims;
|
||||
(void)std::transform(shape_vector.begin(), shape_vector.end(), std::back_inserter(dims),
|
||||
[](const int64_t &value) { return static_cast<int32_t>(value); });
|
||||
(*paramTensor)->dims = dims;
|
||||
if (train_flag_ && (*paramTensor)->dims.empty()) (*paramTensor)->dims = {1};
|
||||
(*paramTensor)->nodeType = NodeType_ValueNode;
|
||||
(*schema_tensor)->dims = dims;
|
||||
if (train_flag_ && (*schema_tensor)->dims.empty()) (*schema_tensor)->dims = {1};
|
||||
(*schema_tensor)->nodeType = NodeType_ValueNode;
|
||||
auto data = value->cast<tensor::TensorPtr>();
|
||||
(*paramTensor)->data.resize(data->Size());
|
||||
ret = memcpy_s((*paramTensor)->data.data(), data->Size(), data->data_c(), data->Size());
|
||||
(*schema_tensor)->data.resize(data->Size());
|
||||
ret = memcpy_s((*schema_tensor)->data.data(), data->Size(), data->data_c(), data->Size());
|
||||
if (ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s error.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
node_id_map_[valueNode->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
node_id_map_[value_node->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
output_cnode->inputIndex.emplace_back(meta_graphT->allTensors.size());
|
||||
meta_graphT->allTensors.emplace_back(std::move(*paramTensor));
|
||||
meta_graphT->allTensors.emplace_back(std::move(*schema_tensor));
|
||||
return ret;
|
||||
}
|
||||
int AnfExporter::ProcessInt32OrInt64Imm(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
int AnfExporter::ProcessInt32OrInt64Imm(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT) {
|
||||
int ret;
|
||||
// data of int64 is converted to int32 here.
|
||||
(*paramTensor)->dataType = kNumberTypeInt32;
|
||||
(*paramTensor)->dims = {1};
|
||||
(*paramTensor)->nodeType = NodeType_ValueNode;
|
||||
(*schema_tensor)->dataType = kNumberTypeInt32;
|
||||
(*schema_tensor)->dims = {1};
|
||||
(*schema_tensor)->nodeType = NodeType_ValueNode;
|
||||
int real_data = opt::CastToInt(value).front();
|
||||
(*paramTensor)->data.resize(sizeof(int32_t));
|
||||
ret = memcpy_s((*paramTensor)->data.data(), sizeof(int32_t), &real_data, sizeof(int32_t));
|
||||
(*schema_tensor)->data.resize(sizeof(int32_t));
|
||||
ret = memcpy_s((*schema_tensor)->data.data(), sizeof(int32_t), &real_data, sizeof(int32_t));
|
||||
if (ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s error.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
node_id_map_[valueNode->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
node_id_map_[value_node->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
output_cnode->inputIndex.emplace_back(meta_graphT->allTensors.size());
|
||||
meta_graphT->allTensors.emplace_back(std::move(*paramTensor));
|
||||
meta_graphT->allTensors.emplace_back(std::move(*schema_tensor));
|
||||
return ret;
|
||||
}
|
||||
void AnfExporter::ProcessBoolImm(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
void AnfExporter::ProcessBoolImm(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT) {
|
||||
auto valueAbstract = valueNode->abstract();
|
||||
auto valueAbstract = value_node->abstract();
|
||||
auto abstractScalar = utils::cast<abstract::AbstractScalarPtr>(valueAbstract);
|
||||
auto typePtr = abstractScalar->GetTypeTrack();
|
||||
(*paramTensor)->dataType = typePtr->type_id();
|
||||
(*paramTensor)->dims = {1};
|
||||
(*paramTensor)->nodeType = NodeType_ValueNode;
|
||||
(*schema_tensor)->dataType = typePtr->type_id();
|
||||
(*schema_tensor)->dims = {1};
|
||||
(*schema_tensor)->nodeType = NodeType_ValueNode;
|
||||
auto data = value->cast<mindspore::BoolImmPtr>();
|
||||
(*paramTensor)->data.emplace_back(data->value());
|
||||
node_id_map_[valueNode->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
(*schema_tensor)->data.emplace_back(data->value());
|
||||
node_id_map_[value_node->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
output_cnode->inputIndex.emplace_back(meta_graphT->allTensors.size());
|
||||
meta_graphT->allTensors.emplace_back(std::move(*paramTensor));
|
||||
meta_graphT->allTensors.emplace_back(std::move(*schema_tensor));
|
||||
}
|
||||
int AnfExporter::ProcessNumber(const ValueNodePtr &valueNode, schema::TensorT *paramTensor,
|
||||
int AnfExporter::ProcessNumber(const ValueNodePtr &value_node, schema::TensorT *schema_tensor,
|
||||
schema::CNodeT *output_cnode, const std::unique_ptr<schema::MetaGraphT> &meta_graphT) {
|
||||
auto data = valueNode->value()->cast<NumberPtr>();
|
||||
paramTensor->data.resize(sizeof(int));
|
||||
auto data = value_node->value()->cast<NumberPtr>();
|
||||
schema_tensor->data.resize(sizeof(int));
|
||||
int number_type = data->number_type();
|
||||
if (EOK != ::memcpy_s(paramTensor->data.data(), sizeof(int), &number_type, sizeof(int))) {
|
||||
if (EOK != ::memcpy_s(schema_tensor->data.data(), sizeof(int), &number_type, sizeof(int))) {
|
||||
MS_LOG(ERROR) << "memcpy_s failed";
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
paramTensor->dataType = kNumberTypeInt32;
|
||||
paramTensor->dims = {1};
|
||||
paramTensor->nodeType = NodeType_ValueNode;
|
||||
node_id_map_[valueNode->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
schema_tensor->dataType = kNumberTypeInt32;
|
||||
schema_tensor->dims = {1};
|
||||
schema_tensor->nodeType = NodeType_ValueNode;
|
||||
node_id_map_[value_node->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
output_cnode->inputIndex.emplace_back(meta_graphT->allTensors.size());
|
||||
meta_graphT->allTensors.emplace_back(paramTensor);
|
||||
meta_graphT->allTensors.emplace_back(schema_tensor);
|
||||
return RET_OK;
|
||||
}
|
||||
void AnfExporter::ProcessInt(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
void AnfExporter::ProcessInt(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
schema::CNodeT *output_cnode, const std::unique_ptr<schema::MetaGraphT> &meta_graphT) {
|
||||
(*paramTensor)->dataType = kNumberTypeInt32;
|
||||
(*paramTensor)->dims = {1};
|
||||
(*paramTensor)->nodeType = NodeType_ValueNode;
|
||||
(*paramTensor)->data.emplace_back(kNumberTypeInt32);
|
||||
node_id_map_[valueNode->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
(*schema_tensor)->dataType = kNumberTypeInt32;
|
||||
(*schema_tensor)->dims = {1};
|
||||
(*schema_tensor)->nodeType = NodeType_ValueNode;
|
||||
(*schema_tensor)->data.emplace_back(kNumberTypeInt32);
|
||||
node_id_map_[value_node->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
output_cnode->inputIndex.emplace_back(meta_graphT->allTensors.size());
|
||||
meta_graphT->allTensors.emplace_back(std::move(*paramTensor));
|
||||
meta_graphT->allTensors.emplace_back(std::move(*schema_tensor));
|
||||
}
|
||||
int AnfExporter::ProcessValueSequence(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
int AnfExporter::ProcessValueSequence(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT) {
|
||||
int ret = RET_OK;
|
||||
auto valueAbstract = valueNode->abstract();
|
||||
auto valueAbstract = value_node->abstract();
|
||||
auto abstractSequnce = utils::cast<abstract::AbstractSequeuePtr>(valueAbstract);
|
||||
if (abstractSequnce->isa<abstract::AbstractTuple>()) {
|
||||
auto abstractTuple = utils::cast<abstract::AbstractTuplePtr>(valueAbstract);
|
||||
|
@ -724,72 +785,71 @@ int AnfExporter::ProcessValueSequence(const ValueNodePtr &valueNode, std::unique
|
|||
return RET_ERROR;
|
||||
}
|
||||
}
|
||||
(*paramTensor)->dataType = kNumberTypeInt32;
|
||||
(*paramTensor)->dims = {static_cast<int32_t>(shape.size())};
|
||||
(*paramTensor)->nodeType = NodeType_ValueNode;
|
||||
(*paramTensor)->data.resize(shape.size() * sizeof(int));
|
||||
ret = memcpy_s((*paramTensor)->data.data(), shape.size() * sizeof(int32_t), shape.data(),
|
||||
(*schema_tensor)->dataType = kNumberTypeInt32;
|
||||
(*schema_tensor)->dims = {static_cast<int32_t>(shape.size())};
|
||||
(*schema_tensor)->nodeType = NodeType_ValueNode;
|
||||
(*schema_tensor)->data.resize(shape.size() * sizeof(int));
|
||||
ret = memcpy_s((*schema_tensor)->data.data(), shape.size() * sizeof(int32_t), shape.data(),
|
||||
shape.size() * sizeof(int32_t));
|
||||
if (ret != RET_OK) {
|
||||
MS_LOG(ERROR) << "memcpy_s data into paramTensor failed.";
|
||||
MS_LOG(ERROR) << "memcpy_s data into schema_tensor failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
node_id_map_[valueNode->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
node_id_map_[value_node->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
output_cnode->inputIndex.emplace_back(meta_graphT->allTensors.size());
|
||||
meta_graphT->allTensors.emplace_back(std::move(*paramTensor));
|
||||
meta_graphT->allTensors.emplace_back(std::move(*schema_tensor));
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
int AnfExporter::ProcessParamValueLite(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT) {
|
||||
int ret;
|
||||
auto valueLite = std::dynamic_pointer_cast<ParamValueLite>(value);
|
||||
(*paramTensor)->data.resize(valueLite->tensor_size());
|
||||
(*paramTensor)->format = schema::Format(valueLite->format());
|
||||
(*paramTensor)->dataType = valueLite->tensor_type();
|
||||
(*paramTensor)->dims = valueLite->tensor_shape();
|
||||
|
||||
if (train_flag_ && (*paramTensor)->dims.empty()) {
|
||||
(*paramTensor)->dims = {1};
|
||||
int AnfExporter::ProcessTensorInfo(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT) {
|
||||
auto tensor_info = std::dynamic_pointer_cast<tensor::Tensor>(value);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Input value is not a tensor";
|
||||
return RET_INPUT_PARAM_INVALID;
|
||||
}
|
||||
auto ret = UpdateTensorTFromTensorInfo(tensor_info, schema_tensor);
|
||||
if (ret != RET_OK) {
|
||||
MS_LOG(ERROR) << "UpdateTensorTFromTensorInfo failed";
|
||||
return ret;
|
||||
}
|
||||
if (train_flag_ && (*schema_tensor)->dims.empty()) {
|
||||
(*schema_tensor)->dims = {1};
|
||||
}
|
||||
|
||||
ret = memcpy_s((*paramTensor)->data.data(), valueLite->tensor_size() * sizeof(uint8_t), valueLite->tensor_addr(),
|
||||
valueLite->tensor_size());
|
||||
if (ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s data into tensor failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
node_id_map_[valueNode->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
node_id_map_[value_node->fullname_with_scope()] = meta_graphT->allTensors.size();
|
||||
output_cnode->inputIndex.emplace_back(meta_graphT->allTensors.size());
|
||||
meta_graphT->allTensors.emplace_back(std::move(*paramTensor));
|
||||
meta_graphT->allTensors.emplace_back(std::move(*schema_tensor));
|
||||
return ret;
|
||||
}
|
||||
|
||||
int AnfExporter::ConvertInputValueNode(const std::shared_ptr<AnfNode> &input_anode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT,
|
||||
schema::CNodeT *output_cnode) {
|
||||
auto valueNode = input_anode->cast<ValueNodePtr>();
|
||||
auto paramTensor = std::make_unique<schema::TensorT>();
|
||||
auto value = valueNode->value();
|
||||
auto value_node = input_anode->cast<ValueNodePtr>();
|
||||
auto schema_tensor = std::make_unique<schema::TensorT>();
|
||||
auto value = value_node->value();
|
||||
int ret = RET_OK;
|
||||
|
||||
if (train_flag_) {
|
||||
paramTensor->name = valueNode->fullname_with_scope();
|
||||
schema_tensor->name = value_node->fullname_with_scope();
|
||||
}
|
||||
if (value->isa<tensor::Tensor>()) {
|
||||
ret = ProcessTensor(valueNode, ¶mTensor, value, output_cnode, meta_graphT);
|
||||
ret = ProcessTensor(value_node, &schema_tensor, value, output_cnode, meta_graphT);
|
||||
} else if (value->isa<mindspore::Int32Imm>() || value->isa<mindspore::Int64Imm>()) {
|
||||
ret = ProcessInt32OrInt64Imm(valueNode, ¶mTensor, value, output_cnode, meta_graphT);
|
||||
ret = ProcessInt32OrInt64Imm(value_node, &schema_tensor, value, output_cnode, meta_graphT);
|
||||
} else if (value->isa<mindspore::BoolImm>()) {
|
||||
ProcessBoolImm(valueNode, ¶mTensor, value, output_cnode, meta_graphT);
|
||||
ProcessBoolImm(value_node, &schema_tensor, value, output_cnode, meta_graphT);
|
||||
} else if (value->isa<mindspore::Int>()) {
|
||||
ProcessInt(valueNode, ¶mTensor, output_cnode, meta_graphT);
|
||||
ProcessInt(value_node, &schema_tensor, output_cnode, meta_graphT);
|
||||
} else if (value->isa<mindspore::ValueSequeue>()) {
|
||||
ret = ProcessValueSequence(valueNode, ¶mTensor, value, output_cnode, meta_graphT);
|
||||
ret = ProcessValueSequence(value_node, &schema_tensor, value, output_cnode, meta_graphT);
|
||||
} else if (value->isa<Number>()) {
|
||||
ret = ProcessNumber(valueNode, paramTensor.release(), output_cnode, meta_graphT);
|
||||
} else if (value->isa<mindspore::ParamValueLite>()) {
|
||||
ret = ProcessParamValueLite(valueNode, ¶mTensor, value, output_cnode, meta_graphT);
|
||||
ret = ProcessNumber(value_node, schema_tensor.release(), output_cnode, meta_graphT);
|
||||
} else if (value->isa<mindspore::tensor::Tensor>()) {
|
||||
ret = ProcessTensorInfo(value_node, &schema_tensor, value, output_cnode, meta_graphT);
|
||||
} else if (value->isa<FuncGraph>()) {
|
||||
MS_LOG(INFO) << "op name:" << input_anode->fullname_with_scope() << " input is func_graph";
|
||||
return RET_OK;
|
||||
|
|
|
@ -25,6 +25,7 @@
|
|||
#include "ops/primitive_c.h"
|
||||
#include "ir/func_graph.h"
|
||||
#include "tools/converter/converter_context.h"
|
||||
#include "tools/converter/converter_flags.h"
|
||||
|
||||
using mindspore::ops::PrimitiveC;
|
||||
|
||||
|
@ -52,25 +53,25 @@ class AnfExporter {
|
|||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT, schema::CNodeT *output_cnode);
|
||||
int ConvertInputValueNode(const std::shared_ptr<AnfNode> &input_anode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT, schema::CNodeT *output_cnode);
|
||||
int ProcessTensor(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
int ProcessTensor(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT);
|
||||
int ProcessInt32OrInt64Imm(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
int ProcessInt32OrInt64Imm(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT);
|
||||
void ProcessBoolImm(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
void ProcessBoolImm(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT);
|
||||
void ProcessInt(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
void ProcessInt(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
schema::CNodeT *output_cnode, const std::unique_ptr<schema::MetaGraphT> &meta_graphT);
|
||||
int ProcessNumber(const ValueNodePtr &valueNode, schema::TensorT *paramTensor, schema::CNodeT *output_cnode,
|
||||
int ProcessNumber(const ValueNodePtr &value_node, schema::TensorT *schema_tensor, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT);
|
||||
int ProcessValueSequence(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
int ProcessValueSequence(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT);
|
||||
int ProcessParamValueLite(const ValueNodePtr &valueNode, std::unique_ptr<schema::TensorT> *paramTensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT);
|
||||
int ProcessTensorInfo(const ValueNodePtr &value_node, std::unique_ptr<schema::TensorT> *schema_tensor,
|
||||
const std::shared_ptr<Value> &value, schema::CNodeT *output_cnode,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT);
|
||||
int SetGraphInputIndex(const std::unique_ptr<schema::MetaGraphT> &meta_graphT, const size_t &subgraph_index);
|
||||
int SetGraphoutputIndex(const CNodePtr &cnode, size_t subgraph_index,
|
||||
const std::unique_ptr<schema::MetaGraphT> &meta_graphT, schema::CNodeT *return_node);
|
||||
|
|
|
@ -14,9 +14,10 @@
|
|||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include "src/common/utils.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "src/common/utils.h"
|
||||
#include "tools/common/graph_util.h"
|
||||
#include "abstract/utils.h"
|
||||
|
||||
namespace mindspore::lite {
|
||||
std::unique_ptr<QuantParamT> GetTensorQuantParam(const std::unique_ptr<TensorT> &tensor) {
|
||||
|
@ -43,6 +44,111 @@ std::unique_ptr<schema::QuantParamT> CopyQuantParamT(const std::unique_ptr<schem
|
|||
return dstQuantParam;
|
||||
}
|
||||
|
||||
tensor::TensorPtr CreateTensorInfo(const void *data, size_t data_size, const std::vector<int64_t> &shape,
|
||||
TypeId data_type) {
|
||||
tensor::TensorPtr tensor_info = nullptr;
|
||||
if (shape.empty() && data_size == mindspore::abstract::TypeIdSize(data_type)) {
|
||||
ShapeVector scalar_shape = {1};
|
||||
tensor_info = std::make_shared<tensor::Tensor>(data_type, scalar_shape);
|
||||
tensor_info->set_shape({});
|
||||
} else {
|
||||
tensor_info = std::make_shared<tensor::Tensor>(data_type, shape);
|
||||
}
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "new tensor init failed";
|
||||
return nullptr;
|
||||
}
|
||||
if (data_size == 0) {
|
||||
return tensor_info;
|
||||
}
|
||||
if (data == nullptr) {
|
||||
MS_LOG(ERROR) << "input tensor data is nullptr";
|
||||
return nullptr;
|
||||
}
|
||||
auto ret = memcpy_s(tensor_info->data_c(), tensor_info->data().nbytes(), data, data_size);
|
||||
if (ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s error : " << ret;
|
||||
return nullptr;
|
||||
}
|
||||
return tensor_info;
|
||||
}
|
||||
|
||||
int SetTensorData(const tensor::TensorPtr &tensor_info, const void *data, size_t data_size) {
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor info is nullptr.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (data == nullptr) {
|
||||
MS_LOG(ERROR) << "data is nullptr.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto ret = memcpy_s(tensor_info->data_c(), tensor_info->data().nbytes(), data, data_size);
|
||||
if (ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s error : " << ret;
|
||||
return RET_ERROR;
|
||||
}
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
std::unique_ptr<schema::TensorT> CreateTensorTFromTensorInfo(const tensor::TensorPtr &tensor_info,
|
||||
const std::string &tensor_name) {
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Input tensor is nullptr";
|
||||
return nullptr;
|
||||
}
|
||||
auto schema_tensor = std::make_unique<schema::TensorT>();
|
||||
schema_tensor->name = tensor_name;
|
||||
auto ret = UpdateTensorTFromTensorInfo(tensor_info, &schema_tensor);
|
||||
if (ret != RET_OK) {
|
||||
MS_LOG(ERROR) << "Init schema tensor failed";
|
||||
return nullptr;
|
||||
}
|
||||
return schema_tensor;
|
||||
}
|
||||
|
||||
int UpdateTensorTFromTensorInfo(const tensor::TensorPtr &src_tensor, std::unique_ptr<schema::TensorT> *dst_tensor) {
|
||||
if (src_tensor == nullptr) {
|
||||
MS_LOG(ERROR) << "Input tensor info is nullptr";
|
||||
return RET_INPUT_PARAM_INVALID;
|
||||
}
|
||||
if (dst_tensor == nullptr || *dst_tensor == nullptr) {
|
||||
MS_LOG(ERROR) << "Input schema tensor is nullptr";
|
||||
return RET_INPUT_PARAM_INVALID;
|
||||
}
|
||||
auto &schema_tensor = *dst_tensor;
|
||||
schema_tensor->format = schema::Format_NHWC;
|
||||
schema_tensor->dataType = src_tensor->data_type();
|
||||
auto &shape_vector = src_tensor->shape();
|
||||
std::vector<int32_t> dims;
|
||||
(void)std::transform(shape_vector.begin(), shape_vector.end(), std::back_inserter(dims),
|
||||
[](const int64_t &value) { return static_cast<int32_t>(value); });
|
||||
schema_tensor->dims = dims;
|
||||
if (src_tensor->data().data() != nullptr) {
|
||||
schema_tensor->data.resize(src_tensor->data().nbytes());
|
||||
if (EOK != memcpy_s(schema_tensor->data.data(), schema_tensor->data.size(), src_tensor->data().data(),
|
||||
src_tensor->data().nbytes())) {
|
||||
MS_LOG(ERROR) << "memcpy_s failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
}
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
int InitParameterFromTensorInfo(const ParameterPtr ¶m_node, const tensor::TensorPtr &tensor_info) {
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor info is nullptr.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto abstract_tensor = tensor_info->ToAbstract();
|
||||
if (abstract_tensor == nullptr) {
|
||||
MS_LOG(ERROR) << "Create abstract tensor failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
param_node->set_abstract(abstract_tensor);
|
||||
param_node->set_default_param(tensor_info);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
size_t GetElementSize(const TensorT &tensor) { return GetElementSize(TypeId(tensor.dataType)); }
|
||||
|
||||
size_t GetElementSize(const TypeId &dataType) {
|
||||
|
|
|
@ -20,12 +20,14 @@
|
|||
#include <cmath>
|
||||
#include <unordered_map>
|
||||
#include <memory>
|
||||
#include <algorithm>
|
||||
#include <utility>
|
||||
#include <string>
|
||||
#include <vector>
|
||||
#include "schema/inner/model_generated.h"
|
||||
#include "src/common/log_adapter.h"
|
||||
#include "ir/dtype/type_id.h"
|
||||
#include "ir/tensor.h"
|
||||
#include "src/common/utils.h"
|
||||
|
||||
namespace mindspore {
|
||||
|
@ -41,6 +43,18 @@ using schema::Format::Format_NHWC;
|
|||
|
||||
std::unique_ptr<QuantParamT> GetTensorQuantParam(const std::unique_ptr<TensorT> &tensor);
|
||||
|
||||
tensor::TensorPtr CreateTensorInfo(const void *data, size_t data_size, const std::vector<int64_t> &shape,
|
||||
TypeId data_type);
|
||||
|
||||
int SetTensorData(const tensor::TensorPtr &tensor_info, const void *data, size_t data_size);
|
||||
|
||||
std::unique_ptr<schema::TensorT> CreateTensorTFromTensorInfo(const tensor::TensorPtr &tensor_info,
|
||||
const std::string &tensor_name = "");
|
||||
|
||||
int UpdateTensorTFromTensorInfo(const tensor::TensorPtr &src_tensor, std::unique_ptr<schema::TensorT> *dst_tensor);
|
||||
|
||||
int InitParameterFromTensorInfo(const ParameterPtr ¶m_node, const tensor::TensorPtr &tensor_info);
|
||||
|
||||
size_t GetElementSize(const TensorT &tensor);
|
||||
|
||||
size_t GetElementSize(const TypeId &dataType);
|
||||
|
|
|
@ -133,7 +133,7 @@ STATUS TensorQuantPass::Run(schema::MetaGraphT *graph) {
|
|||
continue;
|
||||
}
|
||||
if (tensor->quantParams.size() != 1) { // perchannel
|
||||
MS_LOG(ERROR) << "perchannel doquant is not supported yet";
|
||||
MS_LOG(ERROR) << "perchannel do quant is not supported yet";
|
||||
return RET_ERROR;
|
||||
}
|
||||
// perlayer
|
||||
|
|
|
@ -15,7 +15,6 @@
|
|||
*/
|
||||
#include "tools/converter/parser/caffe/caffe_model_parser.h"
|
||||
#include <vector>
|
||||
#include <iostream>
|
||||
#include <map>
|
||||
#include <memory>
|
||||
#include <algorithm>
|
||||
|
@ -23,7 +22,7 @@
|
|||
#include "tools/converter/parser/caffe/caffe_inspector.h"
|
||||
#include "tools/common/graph_util.h"
|
||||
#include "tools/common/protobuf_utils.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "ops/return.h"
|
||||
#include "ops/make_tuple.h"
|
||||
#include "ops/tuple_get_item.h"
|
||||
|
@ -350,8 +349,6 @@ STATUS CaffeModelParser::ConvertBlobs(const caffe::LayerParameter &layer, std::v
|
|||
std::vector<int64_t> shape_vector;
|
||||
(void)std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape_vector);
|
||||
parameter->set_abstract(abstract_tensor);
|
||||
if (layer.type() == "Convolution" || layer.type() == "Deconvolution") {
|
||||
if (i == 0) {
|
||||
parameter->set_name(layer.name() + "/weight");
|
||||
|
@ -361,40 +358,34 @@ STATUS CaffeModelParser::ConvertBlobs(const caffe::LayerParameter &layer, std::v
|
|||
} else {
|
||||
parameter->set_name(layer.name() + "/input-" + std::to_string(i + layer.top_size()));
|
||||
}
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_tensor_type(TypeId::kNumberTypeFloat32);
|
||||
param_value->set_format(schema::Format::Format_NCHW);
|
||||
|
||||
int count = 0;
|
||||
tensor::TensorPtr tensor_info = nullptr;
|
||||
if (layer.blobs(i).double_data_size() > 0) {
|
||||
count = layer.blobs(i).double_data_size();
|
||||
auto buf = std::make_unique<float[]>(count);
|
||||
for (int j = 0; j < count; ++j) {
|
||||
buf[j] = layer.blobs(j).double_data(j);
|
||||
}
|
||||
param_value->set_tensor_addr(buf.release());
|
||||
tensor_info = CreateTensorInfo(buf.get(), count * sizeof(float), shape_vector, TypeId::kNumberTypeFloat32);
|
||||
} else {
|
||||
count = layer.blobs(i).data_size();
|
||||
auto buf = std::make_unique<float[]>(count);
|
||||
if (buf == nullptr) {
|
||||
MS_LOG(INFO) << "new buffer failed";
|
||||
return RET_NULL_PTR;
|
||||
}
|
||||
const float *data_ptr = layer.blobs(i).data().data();
|
||||
if (data_ptr == nullptr) {
|
||||
MS_LOG(INFO) << "data of origin layer is nullptr";
|
||||
return RET_NULL_PTR;
|
||||
}
|
||||
if (EOK != ::memcpy_s(buf.get(), count * sizeof(float), data_ptr, count * sizeof(float))) {
|
||||
MS_LOG(ERROR) << "memcpy_s failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
param_value->set_tensor_addr(buf.release());
|
||||
tensor_info = CreateTensorInfo(data_ptr, count * sizeof(float), shape_vector, TypeId::kNumberTypeFloat32);
|
||||
}
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed";
|
||||
return RET_NULL_PTR;
|
||||
}
|
||||
auto status = InitParameterFromTensorInfo(parameter, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
param_value->set_tensor_size(count * sizeof(float));
|
||||
parameter->set_default_param(param_value);
|
||||
const_parameters->emplace_back(parameter);
|
||||
}
|
||||
return RET_OK;
|
||||
|
|
|
@ -17,19 +17,13 @@
|
|||
#include "tools/converter/parser/onnx/onnx_constant_parser.h"
|
||||
#include <vector>
|
||||
#include <memory>
|
||||
#include <algorithm>
|
||||
#include "tools/converter/parser/onnx/onnx_model_parser.h"
|
||||
#include "ops/constant.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
|
||||
namespace mindspore {
|
||||
namespace lite {
|
||||
STATUS OnnxConstantParser::AddDataInfoAttr(const onnx::TensorProto &onnx_const_tensor, ops::PrimitiveC *prim) {
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
if (param_value == nullptr) {
|
||||
MS_LOG(ERROR) << "new a paramValueLite failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto data_type =
|
||||
OnnxModelParser::GetDataTypeFromOnnx(static_cast<onnx::TensorProto_DataType>(onnx_const_tensor.data_type()));
|
||||
if (data_type == kTypeUnknown) {
|
||||
|
@ -41,14 +35,16 @@ STATUS OnnxConstantParser::AddDataInfoAttr(const onnx::TensorProto &onnx_const_t
|
|||
std::vector<int> shape;
|
||||
std::transform(shape_vector.begin(), shape_vector.end(), std::back_inserter(shape),
|
||||
[](const int64_t &val) { return static_cast<int32_t>(val); });
|
||||
param_value->set_tensor_type(data_type);
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_format(schema::Format_NCHW);
|
||||
if (OnnxModelParser::CopyOnnxTensorData(onnx_const_tensor, param_value) != RET_OK) {
|
||||
auto tensor_info = std::make_shared<tensor::Tensor>(data_type, shape_vector);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "new a paramValueLite failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (OnnxModelParser::CopyOnnxTensorData(onnx_const_tensor, tensor_info) != RET_OK) {
|
||||
MS_LOG(ERROR) << "get value failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
prim->set_attr("const_data", param_value);
|
||||
prim->set_attr("const_data", tensor_info);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
|
|
|
@ -19,70 +19,45 @@
|
|||
#include <memory>
|
||||
#include <vector>
|
||||
#include <algorithm>
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "ops/constant.h"
|
||||
|
||||
namespace mindspore {
|
||||
namespace lite {
|
||||
STATUS OnnxGivenTensorFillParser::ParseInt8GivenIntTensorFill(const onnx::NodeProto &onnx_node, ops::PrimitiveC *prim,
|
||||
const std::vector<int> &shape) {
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
|
||||
int data_count = std::accumulate(shape.begin(), shape.end(), 1, std::multiplies<int>());
|
||||
auto iter = std::find_if(onnx_node.attribute().begin(), onnx_node.attribute().end(),
|
||||
[](const onnx::AttributeProto &attr) { return attr.name() == "values"; });
|
||||
if (iter == onnx_node.attribute().end()) {
|
||||
return RET_OK;
|
||||
}
|
||||
ShapeVector shape_vector(shape.begin(), shape.end());
|
||||
size_t data_size = data_count * sizeof(int64_t) / sizeof(uint8_t);
|
||||
char *param_data = new (std::nothrow) char[data_size];
|
||||
if (param_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new char[] failed";
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
if (iter->ints().data() == nullptr) {
|
||||
MS_LOG(ERROR) << "origin ints data in onnx is nullptr";
|
||||
delete[] param_data;
|
||||
return RET_NULL_PTR;
|
||||
}
|
||||
if (memcpy_s(param_data, data_size, iter->ints().data(), data_size) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy data failed.";
|
||||
delete[] param_data;
|
||||
auto tensor_info = CreateTensorInfo(iter->ints().data(), data_size, shape_vector, kNumberTypeInt64);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Create tensor info failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_format(schema::Format_NUM_OF_FORMAT);
|
||||
param_value->set_tensor_type(kNumberTypeInt64);
|
||||
param_value->SetTensorData(param_data, data_size);
|
||||
prim->set_attr("const_data", param_value);
|
||||
prim->set_attr("const_data", tensor_info);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS OnnxGivenTensorFillParser::ParseInt8GivenTensorFill(const onnx::NodeProto &onnx_node, ops::PrimitiveC *prim,
|
||||
const std::vector<int> &shape) {
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
|
||||
int data_count = std::accumulate(shape.begin(), shape.end(), 1, std::multiplies<int64_t>());
|
||||
auto iter = std::find_if(onnx_node.attribute().begin(), onnx_node.attribute().end(),
|
||||
[](const onnx::AttributeProto &attr) { return attr.name() == "values"; });
|
||||
if (iter == onnx_node.attribute().end()) {
|
||||
return RET_OK;
|
||||
}
|
||||
char *param_data = new (std::nothrow) char[data_count];
|
||||
if (param_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new char[] failed";
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
if (memcpy_s(param_data, data_count, iter->s().data(), data_count) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy data failed.";
|
||||
delete[] param_data;
|
||||
ShapeVector shape_vector(shape.begin(), shape.end());
|
||||
auto tensor_info = CreateTensorInfo(iter->s().data(), data_count, shape_vector, kNumberTypeUInt8);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Create tensor info failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_format(schema::Format_NUM_OF_FORMAT);
|
||||
param_value->set_tensor_type(kNumberTypeUInt8);
|
||||
param_value->SetTensorData(param_data, data_count);
|
||||
prim->set_attr("const_data", param_value);
|
||||
prim->set_attr("const_data", tensor_info);
|
||||
return RET_OK;
|
||||
}
|
||||
ops::PrimitiveC *OnnxGivenTensorFillParser::Parse(const onnx::GraphProto &onnx_graph,
|
||||
|
|
|
@ -20,15 +20,16 @@
|
|||
#include <set>
|
||||
#include <unordered_map>
|
||||
#include <utility>
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "src/common/utils.h"
|
||||
#include "tools/common/graph_util.h"
|
||||
#include "tools/common/protobuf_utils.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "ops/return.h"
|
||||
#include "ops/make_tuple.h"
|
||||
#include "ops/tensor_list_stack.h"
|
||||
#include "ops/tuple_get_item.h"
|
||||
#include "ir/func_graph.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/converter/converter_flags.h"
|
||||
|
||||
namespace mindspore {
|
||||
|
@ -209,6 +210,7 @@ STATUS OnnxModelParser::ConvertNodes(const onnx::GraphProto &onnx_graph, const F
|
|||
status = RET_ERROR;
|
||||
continue;
|
||||
}
|
||||
primitive_c->AddAttr(mindspore::opt::kWeightFormat, MakeValue<int64_t>(Format_NCHW));
|
||||
status = ConvertOpQuantParams(onnx_node, primitive_c);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "convert " << onnx_node.op_type() << " quant param failed.";
|
||||
|
@ -429,25 +431,14 @@ STATUS OnnxModelParser::BuildCNode(const onnx::NodeProto &onnx_node, const FuncG
|
|||
ext_subgraph_input->set_abstract(outside_input_node->abstract());
|
||||
ext_subgraph_input->set_name(input_name);
|
||||
if (outside_input_node->isa<Parameter>()) {
|
||||
auto param_value = outside_input_node->cast<ParameterPtr>()->default_param()->cast<ParamValueLitePtr>();
|
||||
auto copy_param_value = std::make_shared<ParamValueLite>();
|
||||
auto copy_data = new (std::nothrow) char[param_value->tensor_size()];
|
||||
if (copy_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new char[] failed";
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
auto ret =
|
||||
memcpy_s(copy_data, param_value->tensor_size(), param_value->tensor_addr(), param_value->tensor_size());
|
||||
if (ret != EOK) {
|
||||
delete[](copy_data);
|
||||
MS_LOG(ERROR) << "memcpy error: " << ret;
|
||||
auto tensor_info = outside_input_node->cast<ParameterPtr>()->default_param()->cast<tensor::TensorPtr>();
|
||||
auto copy_tensor_info = CreateTensorInfo(tensor_info->data_c(), tensor_info->Size(), tensor_info->shape(),
|
||||
tensor_info->data_type());
|
||||
if (copy_tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "memcpy failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
copy_param_value->set_tensor_shape(param_value->tensor_shape());
|
||||
copy_param_value->set_format(param_value->format());
|
||||
copy_param_value->set_tensor_type(param_value->tensor_type());
|
||||
copy_param_value->SetTensorData(copy_data, param_value->tensor_size());
|
||||
ext_subgraph_input->set_default_param(copy_param_value);
|
||||
ext_subgraph_input->set_default_param(copy_tensor_info);
|
||||
} else {
|
||||
// output inside cnode need make extra input
|
||||
graph_inputs->emplace_back(ext_subgraph_input);
|
||||
|
@ -675,16 +666,16 @@ STATUS OnnxModelParser::CopyTensorQuantParam(const std::string &tensor_name, Qua
|
|||
MS_LOG(ERROR) << "quant param get failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto param_value_lite = quant_parameter_node->default_param()->cast<ParamValueLitePtr>();
|
||||
if (param_value_lite == nullptr) {
|
||||
MS_LOG(ERROR) << "parameterNode's default param is not paramValueLite";
|
||||
auto tensor_info = quant_parameter_node->default_param()->cast<tensor::TensorPtr>();
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "parameterNode's default param is not tensor::TensorPtr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (scale_or_not) {
|
||||
quant_param->scale = *reinterpret_cast<float *>(param_value_lite->tensor_addr());
|
||||
quant_param->scale = *reinterpret_cast<float *>(tensor_info->data_c());
|
||||
quant_param->inited = true;
|
||||
} else {
|
||||
quant_param->zeroPoint = *reinterpret_cast<int64_t *>(param_value_lite->tensor_addr());
|
||||
quant_param->zeroPoint = *reinterpret_cast<int64_t *>(tensor_info->data_c());
|
||||
quant_param->inited = true;
|
||||
}
|
||||
return RET_OK;
|
||||
|
@ -704,10 +695,14 @@ ParameterPtr CreateConstParamter(const FuncGraphPtr &anf_graph, int val) {
|
|||
return nullptr;
|
||||
}
|
||||
tensor_data[0] = val;
|
||||
auto param_value = std::make_shared<ParamValueLite>();
|
||||
param_value->set_tensor_shape({});
|
||||
param_value->SetTensorData(tensor_data, sizeof(int));
|
||||
const_node->set_default_param(param_value);
|
||||
auto tensor_info = CreateTensorInfo(tensor_data, 1 * sizeof(int), {1}, kNumberTypeInt32);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
delete[] tensor_data;
|
||||
return nullptr;
|
||||
}
|
||||
delete[] tensor_data;
|
||||
const_node->set_default_param(tensor_info);
|
||||
return const_node;
|
||||
}
|
||||
|
||||
|
@ -841,10 +836,9 @@ STATUS OnnxModelParser::AddTensorArrayEdge(const FuncGraphPtr &anf_graph, std::v
|
|||
auto while_tensor_array_input = anf_root_graph->add_parameter();
|
||||
std::vector<int64_t> shape_vector;
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(kTensorType, shape_vector);
|
||||
auto param_value = std::make_shared<ParamValueLite>();
|
||||
param_value->set_tensor_type(kObjectTypeTensorType);
|
||||
auto tensor_info = std::make_shared<tensor::Tensor>(kObjectTypeTensorType, shape_vector);
|
||||
while_tensor_array_input->set_abstract(abstract_tensor);
|
||||
while_tensor_array_input->set_default_param(param_value);
|
||||
while_tensor_array_input->set_default_param(tensor_info);
|
||||
while_tensor_array_input->set_name(loop_node_name + "_scan_outputs_tensorarray");
|
||||
root_while_node->add_input(while_tensor_array_input);
|
||||
|
||||
|
@ -1035,33 +1029,18 @@ STATUS OnnxModelParser::BuildParameterNodeForQuantParam(const void *data, const
|
|||
}
|
||||
parameter_node->set_abstract(abstract_tensor);
|
||||
parameter_node->set_name(name);
|
||||
std::vector<int> shape;
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
if (param_value == nullptr) {
|
||||
MS_LOG(ERROR) << "new param_value failed";
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_format(schema::Format_NUM_OF_FORMAT);
|
||||
param_value->set_tensor_type(type);
|
||||
int data_size = 0;
|
||||
if (type == kNumberTypeFloat32) {
|
||||
data_size = sizeof(float);
|
||||
} else {
|
||||
data_size = sizeof(int64_t);
|
||||
}
|
||||
auto *tensor_data = new (std::nothrow) char[data_size];
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new char[] failed";
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
if (memcpy_s(tensor_data, data_size, data, data_size) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy data failed.";
|
||||
delete[] tensor_data;
|
||||
auto tensor_info = CreateTensorInfo(data, data_size, {1}, type);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
param_value->SetTensorData(tensor_data, data_size);
|
||||
parameter_node->set_default_param(param_value);
|
||||
parameter_node->set_default_param(tensor_info);
|
||||
anf_nodes_map_.emplace(name, parameter_node);
|
||||
return RET_OK;
|
||||
}
|
||||
|
@ -1078,26 +1057,23 @@ STATUS OnnxModelParser::BuildParameterNode(const ParameterPtr ¶meter_node, c
|
|||
parameter_node->set_abstract(abstract_tensor);
|
||||
parameter_node->set_name(tensor.name());
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
auto tensor_info = std::make_shared<tensor::Tensor>(data_type, shape_vector);
|
||||
std::vector<int> shape;
|
||||
std::transform(shape_vector.begin(), shape_vector.end(), std::back_inserter(shape),
|
||||
[](const int64_t &value) { return static_cast<int>(value); });
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_tensor_type(data_type);
|
||||
param_value->set_format(schema::Format::Format_NCHW);
|
||||
auto status = CopyOnnxTensorData(tensor, param_value);
|
||||
auto status = CopyOnnxTensorData(tensor, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "copy data failed.";
|
||||
return status;
|
||||
}
|
||||
parameter_node->set_default_param(param_value);
|
||||
parameter_node->set_default_param(tensor_info);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS OnnxModelParser::CopyOnnxTensorData(const onnx::TensorProto &onnx_const_tensor,
|
||||
const ParamValueLitePtr ¶m_value_lite) {
|
||||
if (param_value_lite == nullptr) {
|
||||
MS_LOG(ERROR) << "param_value_lite is nullptr.";
|
||||
const tensor::TensorPtr &tensor_info) {
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor_info is nullptr.";
|
||||
return RET_NULL_PTR;
|
||||
}
|
||||
size_t data_count = 1;
|
||||
|
@ -1150,17 +1126,11 @@ STATUS OnnxModelParser::CopyOnnxTensorData(const onnx::TensorProto &onnx_const_t
|
|||
MS_LOG(ERROR) << "origin data in onnx model is nullptr";
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
char *param_data = new (std::nothrow) char[data_size];
|
||||
if (param_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new char[] failed";
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
if (memcpy_s(static_cast<void *>(param_data), data_size, onnx_data, data_size) != EOK) {
|
||||
auto tensor_data = reinterpret_cast<uint8_t *>(tensor_info->data_c());
|
||||
if (memcpy_s(tensor_data, data_size, onnx_data, data_size) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s failed";
|
||||
delete[] param_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
param_value_lite->SetTensorData(param_data, data_size);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
|
|
|
@ -31,7 +31,6 @@
|
|||
#include "tools/converter/model_parser.h"
|
||||
#include "tools/converter/parser/onnx/onnx_node_parser_registry.h"
|
||||
#include "proto/onnx.pb.h"
|
||||
#include "src/param_value_lite.h"
|
||||
|
||||
namespace mindspore {
|
||||
namespace lite {
|
||||
|
@ -44,8 +43,8 @@ class OnnxModelParser : public ModelParser {
|
|||
FuncGraphPtr Parse(const std::string &model_file, const std::string &weight_file,
|
||||
const QuantType &quant_type) override;
|
||||
static TypeId GetDataTypeFromOnnx(onnx::TensorProto_DataType onnx_type);
|
||||
static STATUS CopyOnnxTensorData(const onnx::TensorProto &onnx_const_value,
|
||||
const ParamValueLitePtr ¶m_value_lite);
|
||||
static STATUS CopyOnnxTensorData(const onnx::TensorProto &onnx_const_tensor,
|
||||
const tensor::TensorPtr ¶m_value_lite);
|
||||
|
||||
private:
|
||||
STATUS InitOriginModel(const std::string &model_file);
|
||||
|
|
|
@ -20,7 +20,6 @@
|
|||
#include <set>
|
||||
#include "src/common/log_adapter.h"
|
||||
#include "src/common/utils.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/common/graph_util.h"
|
||||
#include "tools/common/protobuf_utils.h"
|
||||
#include "tools/converter/parser/tf/tf_node_parser_registry.h"
|
||||
|
@ -29,6 +28,7 @@
|
|||
#include "ops/make_tuple.h"
|
||||
#include "ops/tuple_get_item.h"
|
||||
#include "ir/anf.h"
|
||||
#include "abstract/utils.h"
|
||||
#include "tools/converter/converter_flags.h"
|
||||
|
||||
namespace mindspore {
|
||||
|
@ -85,12 +85,30 @@ STATUS CheckStrView(std::string_view str_view, uint64_t *scratch) {
|
|||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS GetFloatValue(const tensorflow::TensorProto &tensor_proto, const tensorflow::TensorShapeProto &tensor_shape,
|
||||
ParamValueLitePtr param_value, int shape_size) {
|
||||
auto tensor_data = new (std::nothrow) float[shape_size];
|
||||
int GetShapeSize(const tensorflow::TensorProto &tensor_proto) {
|
||||
auto &tensor_shape = tensor_proto.tensor_shape();
|
||||
int shape_size = 1;
|
||||
for (int i = 0; i < tensor_shape.dim_size(); i++) {
|
||||
shape_size *= tensor_shape.dim(i).size();
|
||||
}
|
||||
return shape_size;
|
||||
}
|
||||
|
||||
STATUS SetFloatTensorInfo(const tensorflow::TensorProto &tensor_proto, tensor::TensorPtr *tensor_info) {
|
||||
auto shape_size = GetShapeSize(tensor_proto);
|
||||
auto &tensor_shape = tensor_proto.tensor_shape();
|
||||
ShapeVector shape_vector{};
|
||||
for (int i = 0; i < tensor_shape.dim_size(); i++) {
|
||||
shape_vector.push_back(tensor_shape.dim(i).size());
|
||||
}
|
||||
*tensor_info = CreateTensorInfo(nullptr, 0, shape_vector, kNumberTypeFloat32);
|
||||
if (*tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor data failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto tensor_data = reinterpret_cast<float *>((*tensor_info)->data_c());
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new data failed";
|
||||
delete[] tensor_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
|
@ -107,17 +125,25 @@ STATUS GetFloatValue(const tensorflow::TensorProto &tensor_proto, const tensorfl
|
|||
return RET_ERROR;
|
||||
}
|
||||
}
|
||||
auto tensor_size = shape_size * sizeof(float);
|
||||
param_value->SetTensorData(tensor_data, tensor_size);
|
||||
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS GetInt32Value(const tensorflow::TensorProto &tensor_proto, const tensorflow::TensorShapeProto &tensor_shape,
|
||||
ParamValueLitePtr param_value, int shape_size) {
|
||||
auto tensor_data = new (std::nothrow) int[shape_size];
|
||||
STATUS SetInt32TensorInfo(const tensorflow::TensorProto &tensor_proto, tensor::TensorPtr *tensor_info) {
|
||||
auto shape_size = GetShapeSize(tensor_proto);
|
||||
auto &tensor_shape = tensor_proto.tensor_shape();
|
||||
ShapeVector shape_vector{};
|
||||
for (int i = 0; i < tensor_shape.dim_size(); i++) {
|
||||
shape_vector.push_back(tensor_shape.dim(i).size());
|
||||
}
|
||||
*tensor_info = CreateTensorInfo(nullptr, 0, shape_vector, kNumberTypeInt32);
|
||||
if (*tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor data failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto tensor_data = reinterpret_cast<int *>((*tensor_info)->data_c());
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new data failed";
|
||||
delete[] tensor_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
|
@ -134,21 +160,29 @@ STATUS GetInt32Value(const tensorflow::TensorProto &tensor_proto, const tensorfl
|
|||
return RET_ERROR;
|
||||
}
|
||||
}
|
||||
auto tensor_size = shape_size * sizeof(int);
|
||||
param_value->SetTensorData(tensor_data, tensor_size);
|
||||
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS GetInt64Value(const tensorflow::TensorProto &tensor_proto, const tensorflow::TensorShapeProto &tensor_shape,
|
||||
ParamValueLitePtr param_value, int shape_size) {
|
||||
param_value->set_tensor_type(kNumberTypeInt32);
|
||||
auto *tensor_data = new (std::nothrow) int[shape_size];
|
||||
STATUS SetInt64TensorInfo(const tensorflow::TensorProto &tensor_proto, tensor::TensorPtr *tensor_info) {
|
||||
auto shape_size = GetShapeSize(tensor_proto);
|
||||
auto &tensor_shape = tensor_proto.tensor_shape();
|
||||
ShapeVector shape_vector{};
|
||||
for (int i = 0; i < tensor_shape.dim_size(); i++) {
|
||||
shape_vector.push_back(tensor_shape.dim(i).size());
|
||||
}
|
||||
*tensor_info = CreateTensorInfo(nullptr, 0, shape_vector, kNumberTypeInt32);
|
||||
if (*tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor data failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto tensor_data = reinterpret_cast<int *>((*tensor_info)->data_c());
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new data failed";
|
||||
delete[] tensor_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (tensor_shape.dim_size() == 0) { // scalar
|
||||
if (tensor_proto.tensor_shape().dim_size() == 0) { // scalar
|
||||
const auto &origin_data = tensor_proto.int64_val();
|
||||
for (int i = 0; i < tensor_proto.int64_val_size(); ++i) {
|
||||
if (origin_data[i] > static_cast<int64_t>(INT32_MAX) || origin_data[i] < static_cast<int64_t>(INT32_MIN)) {
|
||||
|
@ -170,14 +204,84 @@ STATUS GetInt64Value(const tensorflow::TensorProto &tensor_proto, const tensorfl
|
|||
}
|
||||
}
|
||||
}
|
||||
param_value->SetTensorData(tensor_data, shape_size * sizeof(int32_t));
|
||||
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS SetBoolTensorInfo(const tensorflow::TensorProto &tensor_proto, tensor::TensorPtr *tensor_info) {
|
||||
auto shape_size = GetShapeSize(tensor_proto);
|
||||
auto &tensor_shape = tensor_proto.tensor_shape();
|
||||
ShapeVector shape_vector{};
|
||||
for (int i = 0; i < tensor_shape.dim_size(); i++) {
|
||||
shape_vector.push_back(tensor_shape.dim(i).size());
|
||||
}
|
||||
*tensor_info = CreateTensorInfo(nullptr, 0, shape_vector, kNumberTypeBool);
|
||||
if (*tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor data failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto tensor_data = reinterpret_cast<bool *>((*tensor_info)->data_c());
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new data failed";
|
||||
delete[] tensor_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
if (tensor_proto.bool_val_size() == 1) {
|
||||
int value = tensor_proto.bool_val(0);
|
||||
for (int i = 0; i < shape_size; i++) {
|
||||
tensor_data[i] = value;
|
||||
}
|
||||
}
|
||||
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS SetStringTensorInfo(const tensorflow::TensorProto &tensor_proto, tensor::TensorPtr *tensor_info) {
|
||||
auto &tensor_shape = tensor_proto.tensor_shape();
|
||||
ShapeVector shape_vector{};
|
||||
for (int i = 0; i < tensor_shape.dim_size(); i++) {
|
||||
shape_vector.push_back(tensor_shape.dim(i).size());
|
||||
}
|
||||
std::string shape_str;
|
||||
shape_str += std::to_string(shape_vector.size()) + ",";
|
||||
for (auto &dim : shape_vector) {
|
||||
shape_str += std::to_string(dim) + ",";
|
||||
}
|
||||
|
||||
auto tensor_data = new (std::nothrow) string;
|
||||
if (tensor_proto.string_val_size() == 1) {
|
||||
*tensor_data = tensor_proto.string_val(0);
|
||||
} else {
|
||||
MS_LOG(ERROR) << "string size bigger than one, not support.";
|
||||
delete tensor_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
shape_vector = {static_cast<int64_t>(shape_str.size() + (*tensor_data).size())};
|
||||
*tensor_info = CreateTensorInfo(nullptr, 0, shape_vector, kObjectTypeString);
|
||||
if (*tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto tensor_info_data = reinterpret_cast<uint8_t *>((*tensor_info)->data_c());
|
||||
if (memcpy_s(tensor_info_data, shape_str.size(), shape_str.data(), shape_str.size()) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (memcpy_s(tensor_info_data + shape_str.size(), (*tensor_data).size(), (*tensor_data).data(),
|
||||
(*tensor_data).size()) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
delete tensor_data;
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
} // namespace
|
||||
|
||||
STATUS TFModelParser::ConvertConstVariant(const tensorflow::TensorProto &tensor_proto,
|
||||
const ParamValueLitePtr ¶m_value) {
|
||||
STATUS TFModelParser::ConvertConstVariant(const tensorflow::TensorProto &tensor_proto, tensor::TensorPtr *tensor_info) {
|
||||
if (tensor_proto.variant_val_size() != 1) {
|
||||
MS_LOG(ERROR) << "only support variant_val_size == 1 now";
|
||||
return RET_ERROR;
|
||||
|
@ -211,23 +315,6 @@ STATUS TFModelParser::ConvertConstVariant(const tensorflow::TensorProto &tensor_
|
|||
tensorflow::TensorShapeProto element_shape_proto;
|
||||
element_shape_proto.ParseFromString(std::string(str_view.data(), str_view.size()));
|
||||
auto dim_size = element_shape_proto.dim_size();
|
||||
auto tensor_data = new (std::nothrow) int[dim_size + 2]; // encode element_dtype,shape.size,shape[i]... into data
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor_data is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
tensor_data[0] = TensorFlowUtils::GetTFDataType(tensorflow::DataType(element_dtype));
|
||||
tensor_data[1] = element_shape_proto.dim_size();
|
||||
for (int i = 0; i < dim_size; ++i) {
|
||||
auto dim = element_shape_proto.dim(i).size();
|
||||
if (dim > static_cast<int64_t>(INT32_MAX) || dim < static_cast<int64_t>(INT32_MIN)) {
|
||||
MS_LOG(ERROR) << "int64 data " << dim << " too big to fit into int32";
|
||||
delete[] tensor_data;
|
||||
return RET_ERROR;
|
||||
} else {
|
||||
tensor_data[i + 2] = static_cast<int>(dim);
|
||||
}
|
||||
}
|
||||
std::vector<int> tensor_list_data(dim_size + 2);
|
||||
tensor_list_data[0] = TensorFlowUtils::GetTFDataType(tensorflow::DataType(element_dtype));
|
||||
tensor_list_data[1] = element_shape_proto.dim_size();
|
||||
|
@ -235,7 +322,6 @@ STATUS TFModelParser::ConvertConstVariant(const tensorflow::TensorProto &tensor_
|
|||
auto dim = element_shape_proto.dim(i).size();
|
||||
if (dim > static_cast<int64_t>(INT32_MAX) || dim < static_cast<int64_t>(INT32_MIN)) {
|
||||
MS_LOG(ERROR) << "int64 data " << dim << " too big to fit into int32";
|
||||
delete[] tensor_data;
|
||||
return RET_ERROR;
|
||||
} else {
|
||||
tensor_list_data[i + 2] = static_cast<int>(dim);
|
||||
|
@ -250,51 +336,30 @@ STATUS TFModelParser::ConvertConstVariant(const tensorflow::TensorProto &tensor_
|
|||
}
|
||||
tensor_list_data.insert(tensor_list_data.end(), single_tensor_data.begin(), single_tensor_data.end());
|
||||
}
|
||||
auto tensor_data_ptr = new (std::nothrow) int[tensor_list_data.size()];
|
||||
if (tensor_data_ptr == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor_data is nullptr";
|
||||
return RET_NULL_PTR;
|
||||
*tensor_info = CreateTensorInfo(tensor_list_data.data(), tensor_list_data.size() * sizeof(int),
|
||||
{static_cast<int64_t>(tensor_list_data.size())}, kObjectTypeTensorType);
|
||||
if (*tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor data failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (EOK != ::memcpy_s(tensor_data_ptr, tensor_list_data.size() * sizeof(int), tensor_list_data.data(),
|
||||
tensor_list_data.size() * sizeof(int))) {
|
||||
MS_LOG(ERROR) << "memcpy_s failed";
|
||||
return RET_NULL_PTR;
|
||||
}
|
||||
param_value->SetTensorData(tensor_data_ptr, tensor_list_data.size() * sizeof(int));
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS TFModelParser::GetValueFromType(const tensorflow::TensorProto &tensor_proto,
|
||||
const tensorflow::TensorShapeProto &tensor_shape, ParamValueLitePtr param_value,
|
||||
const TypeId &type, int shape_size) {
|
||||
STATUS TFModelParser::SetTensorInfoFromType(const tensorflow::TensorProto &tensor_proto,
|
||||
tensor::TensorPtr *tensor_info) {
|
||||
auto type = (*tensor_info)->data_type();
|
||||
if (type == kNumberTypeFloat32 || type == kNumberTypeFloat) {
|
||||
return GetFloatValue(tensor_proto, tensor_shape, param_value, shape_size);
|
||||
return SetFloatTensorInfo(tensor_proto, tensor_info);
|
||||
} else if (type == kNumberTypeInt32 || type == kNumberTypeInt) {
|
||||
return GetInt32Value(tensor_proto, tensor_shape, param_value, shape_size);
|
||||
return SetInt32TensorInfo(tensor_proto, tensor_info);
|
||||
} else if (type == kNumberTypeInt64) {
|
||||
return GetInt64Value(tensor_proto, tensor_shape, param_value, shape_size);
|
||||
return SetInt64TensorInfo(tensor_proto, tensor_info);
|
||||
} else if (type == kNumberTypeBool) {
|
||||
auto tensor_data = new (std::nothrow) int[shape_size];
|
||||
if (tensor_proto.bool_val_size() == 1) {
|
||||
int value = tensor_proto.bool_val(0);
|
||||
for (int i = 0; i < shape_size; i++) {
|
||||
tensor_data[i] = value;
|
||||
}
|
||||
}
|
||||
auto tensor_size = shape_size * sizeof(int);
|
||||
param_value->SetTensorData(tensor_data, tensor_size);
|
||||
return SetBoolTensorInfo(tensor_proto, tensor_info);
|
||||
} else if (type == kObjectTypeTensorType) {
|
||||
return ConvertConstVariant(tensor_proto, param_value);
|
||||
return ConvertConstVariant(tensor_proto, tensor_info);
|
||||
} else if (type == kObjectTypeString) {
|
||||
auto tensor_data = new (std::nothrow) string;
|
||||
if (tensor_proto.string_val_size() == 1) {
|
||||
*tensor_data = tensor_proto.string_val(0);
|
||||
} else {
|
||||
MS_LOG(ERROR) << "string size bigger than one, not support.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto tensor_size = (*tensor_data).size();
|
||||
param_value->SetTensorData(tensor_data, tensor_size);
|
||||
return SetStringTensorInfo(tensor_proto, tensor_info);
|
||||
} else {
|
||||
MS_LOG(ERROR) << "Unsupported dataType: " << type;
|
||||
return RET_ERROR;
|
||||
|
@ -309,35 +374,25 @@ STATUS TFModelParser::ConvertConstTensor(const tensorflow::NodeDef &node_def, co
|
|||
MS_ASSERT(shape_vector != nullptr);
|
||||
const tensorflow::TensorProto &tensor_proto = attr_value.tensor();
|
||||
const tensorflow::TensorShapeProto &tensor_shape = tensor_proto.tensor_shape();
|
||||
int shape_size = 1;
|
||||
shape_vector->clear();
|
||||
for (int i = 0; i < tensor_shape.dim_size(); i++) {
|
||||
shape_vector->push_back(tensor_shape.dim(i).size());
|
||||
shape_size *= tensor_shape.dim(i).size();
|
||||
}
|
||||
|
||||
auto param_value = std::make_shared<ParamValueLite>();
|
||||
if (param_value == nullptr) {
|
||||
MS_LOG(ERROR) << "param_value is nullptr";
|
||||
auto tensor_info = std::make_shared<tensor::Tensor>(type, *shape_vector);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor info is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
param_value->set_tensor_type(type);
|
||||
if (GetValueFromType(tensor_proto, tensor_shape, param_value, type, shape_size) != RET_OK) {
|
||||
MS_LOG(ERROR) << "get value from type failed.";
|
||||
auto status = SetTensorInfoFromType(tensor_proto, &tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "set tensor data from type failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
std::vector<int> param_shape(shape_vector->begin(), shape_vector->end());
|
||||
param_value->set_tensor_shape(param_shape);
|
||||
if (TensorFlowUtils::FindAttrValue(node_def, "data_format", const_cast<tensorflow::AttrValue *>(&attr_value))) {
|
||||
auto format = mindspore::lite::TensorFlowUtils::ParseNodeFormat(node_def);
|
||||
if (format == mindspore::Format::NUM_OF_FORMAT) {
|
||||
MS_LOG(ERROR) << "Do not support data format: " << attr_value.s();
|
||||
}
|
||||
param_value->set_format(format);
|
||||
} else {
|
||||
param_value->set_format(schema::Format::Format_NHWC);
|
||||
status = InitParameterFromTensorInfo(parameter, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
parameter->set_default_param(param_value);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
|
@ -365,6 +420,7 @@ STATUS TFModelParser::ConvertParameter(const tensorflow::NodeDef &node, const Pa
|
|||
MS_LOG(INFO) << "Found value attr, means it has default value";
|
||||
auto status = ConvertConstTensor(node, attr_value, type, parameter, &shape_vector);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "convert const tensor failed.";
|
||||
return status;
|
||||
}
|
||||
} else {
|
||||
|
|
|
@ -29,7 +29,6 @@
|
|||
#include "securec/include/securec.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "tools/converter/model_parser.h"
|
||||
#include "src/param_value_lite.h"
|
||||
|
||||
namespace mindspore {
|
||||
namespace lite {
|
||||
|
@ -41,12 +40,10 @@ class TFModelParser : public ModelParser {
|
|||
FuncGraphPtr Parse(const std::string &modelFile, const std::string &weightFile, const QuantType &quantType);
|
||||
|
||||
private:
|
||||
static STATUS ConvertConstVariant(const tensorflow::TensorProto &tensor_proto, const ParamValueLitePtr ¶m_value);
|
||||
static STATUS ConvertConstVariant(const tensorflow::TensorProto &tensor_proto, tensor::TensorPtr *tensor_info);
|
||||
STATUS ConvertConstTensor(const tensorflow::NodeDef &node_def, const tensorflow::AttrValue &attr_value,
|
||||
const TypeId &type, const ParameterPtr ¶meter, std::vector<int64_t> *shape_vector);
|
||||
static STATUS GetValueFromType(const tensorflow::TensorProto &tensor_proto,
|
||||
const tensorflow::TensorShapeProto &tensor_shape, ParamValueLitePtr param_value,
|
||||
const TypeId &type, int shape_size);
|
||||
static STATUS SetTensorInfoFromType(const tensorflow::TensorProto &tensor_proto, tensor::TensorPtr *tensor_info);
|
||||
STATUS ConvertParameter(const tensorflow::NodeDef &node, const ParameterPtr ¶meter,
|
||||
std::unordered_map<std::string, AnfNodePtr> *anf_node_map);
|
||||
STATUS ConvertGraphInputsAndConsts(const std::map<std::string, const tensorflow::NodeDef *> &tf_graph_nodes,
|
||||
|
|
|
@ -20,7 +20,6 @@
|
|||
#include <algorithm>
|
||||
#include <utility>
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "src/common/file_utils.h"
|
||||
#include "ops/return.h"
|
||||
#include "ops/make_tuple.h"
|
||||
|
@ -160,7 +159,7 @@ STATUS TfliteModelParser::ConvertOps() {
|
|||
tensor_name = GetTensorName(i, tflite_op_type, op_name);
|
||||
}
|
||||
auto parameter = func_graph_->add_parameter();
|
||||
status = ConvertConstTensor(input_tensor.get(), parameter.get(), tensor_name);
|
||||
status = ConvertConstTensor(input_tensor.get(), parameter, tensor_name);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "convert " << op_name << " node: " << input_idx << " const node failed.";
|
||||
continue;
|
||||
|
@ -354,7 +353,7 @@ STATUS TfliteModelParser::ConvertGraphOutputs() {
|
|||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS TfliteModelParser::ConvertConstTensor(const tflite::TensorT *tensor, Parameter *parameter,
|
||||
STATUS TfliteModelParser::ConvertConstTensor(const tflite::TensorT *tensor, const ParameterPtr ¶meter,
|
||||
const std::string &tensor_name) {
|
||||
if (tensor == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor is null, get const tensor failed.";
|
||||
|
@ -366,31 +365,53 @@ STATUS TfliteModelParser::ConvertConstTensor(const tflite::TensorT *tensor, Para
|
|||
return RET_NULL_PTR;
|
||||
}
|
||||
const auto &tflite_model_buffers = tflite_model_->buffers;
|
||||
auto type_ptr = TypeIdToType(GetTfliteDataType(tensor->type));
|
||||
auto type_id = GetTfliteDataType(tensor->type);
|
||||
std::vector<int64_t> shape_vector;
|
||||
(void)std::transform(tensor->shape.begin(), tensor->shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape_vector);
|
||||
parameter->set_abstract(abstract_tensor);
|
||||
parameter->set_name(tensor_name);
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
param_value->set_tensor_shape(tensor->shape);
|
||||
param_value->set_tensor_type(GetTfliteDataType(tensor->type));
|
||||
param_value->set_format(schema::Format::Format_NHWC);
|
||||
const auto &data = tflite_model_buffers.at(tensor->buffer)->data;
|
||||
if (!data.empty()) {
|
||||
auto size = data.size();
|
||||
char *tensor_data = new (std::nothrow) char[size];
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new char[] failed";
|
||||
return RET_MEMORY_FAILED;
|
||||
std::string shape_str;
|
||||
if (data.empty()) {
|
||||
shape_vector = {};
|
||||
} else if (type_id == kObjectTypeString) {
|
||||
shape_str += std::to_string(tensor->shape.size()) + ",";
|
||||
for (auto &dim : tensor->shape) {
|
||||
shape_str += std::to_string(dim) + ",";
|
||||
}
|
||||
std::memcpy(tensor_data, data.data(), size);
|
||||
param_value->SetTensorData(tensor_data, size);
|
||||
shape_vector = {static_cast<int64_t>(shape_str.size() + data.size())};
|
||||
} else {
|
||||
(void)std::transform(tensor->shape.begin(), tensor->shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
}
|
||||
parameter->set_default_param(param_value);
|
||||
|
||||
auto tensor_info = CreateTensorInfo(nullptr, 0, shape_vector, type_id);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "init tensor info failed";
|
||||
return RET_NULL_PTR;
|
||||
}
|
||||
if (!data.empty()) {
|
||||
auto tensor_data = reinterpret_cast<uint8_t *>(tensor_info->data_c());
|
||||
if (type_id == kObjectTypeString) {
|
||||
if (memcpy_s(tensor_data, shape_str.size(), shape_str.data(), shape_str.size()) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (memcpy_s(tensor_data + shape_str.size(), data.size(), data.data(), data.size()) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
} else {
|
||||
if (memcpy_s(tensor_data, tensor_info->Size(), data.data(), data.size()) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
}
|
||||
}
|
||||
auto status = InitParameterFromTensorInfo(parameter, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
parameter->set_name(tensor_name);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
|
|
|
@ -41,7 +41,8 @@ class TfliteModelParser : public ModelParser {
|
|||
FuncGraphPtr func_graph_;
|
||||
char *tflite_model_buf_ = nullptr;
|
||||
std::unique_ptr<tflite::ModelT> ReadTfliteModel(const char *model_path);
|
||||
STATUS ConvertConstTensor(const tflite::TensorT *tensor, Parameter *parameter, const std::string &tensor_name);
|
||||
STATUS ConvertConstTensor(const tflite::TensorT *tensor, const ParameterPtr ¶meter,
|
||||
const std::string &tensor_name);
|
||||
STATUS ConvertOutputTensor(const tflite::OperatorT *op, const CNodePtr &dst_cnode);
|
||||
STATUS ConvertOpQuantParams(const tflite::OperatorT *op, ops::PrimitiveC *primitive_c);
|
||||
STATUS ConvertOps();
|
||||
|
|
|
@ -15,21 +15,20 @@
|
|||
*/
|
||||
|
||||
#include "tools/converter/quantizer/huffman_encode.h"
|
||||
#include <utility>
|
||||
#include "src/dequant.h"
|
||||
#include "tools/converter/quantizer/quantize_util.h"
|
||||
|
||||
namespace mindspore {
|
||||
namespace lite {
|
||||
STATUS HuffmanEncode::DoHuffmanEncode(const ParamValueLitePtr &weight, const PrimitivePtr &primitive, void *quant_datas,
|
||||
STATUS HuffmanEncode::DoHuffmanEncode(const tensor::TensorPtr &weight, const PrimitivePtr &primitive, void *quant_datas,
|
||||
const size_t &bit_num) {
|
||||
if (quant_datas == nullptr) {
|
||||
MS_LOG(ERROR) << "quant data is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto *raw_datas = static_cast<int8_t *>(quant_datas);
|
||||
size_t elem_count = weight->tensor_shape_size();
|
||||
size_t packed_size = elem_count * bit_num;
|
||||
size_t elem_count = weight->DataSize();
|
||||
int packed_size = elem_count * bit_num;
|
||||
|
||||
HuffmanPriorityQueue pq;
|
||||
auto status = GetHuffmanPriorityQueue(raw_datas, elem_count, &pq);
|
||||
|
@ -47,19 +46,16 @@ STATUS HuffmanEncode::DoHuffmanEncode(const ParamValueLitePtr &weight, const Pri
|
|||
MS_LOG(ERROR) << "DoHuffmanCompress failed";
|
||||
return status;
|
||||
}
|
||||
size_t ch_size = huffman_encoded_str_.length();
|
||||
int ch_size = huffman_encoded_str_.length();
|
||||
if (ch_size < packed_size) {
|
||||
auto encode_data = new (std::nothrow) char[ch_size];
|
||||
if (encode_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new char[] failed.";
|
||||
return RET_MEMORY_FAILED;
|
||||
if (ch_size != weight->data().nbytes()) {
|
||||
MS_LOG(ERROR) << "Data size of weight is error.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (memcpy_s(encode_data, ch_size, huffman_encoded_str_.c_str(), ch_size) != EOK) {
|
||||
if (memcpy_s(weight->data_c(), weight->data().nbytes(), huffman_encoded_str_.c_str(), ch_size) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s failed.";
|
||||
delete[] encode_data;
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
weight->SetTensorData(encode_data, ch_size);
|
||||
auto quant_param_holder = quant::GetCNodeQuantHolder(primitive);
|
||||
MS_ASSERT(quant_param_holder != nullptr);
|
||||
quant_param_holder->set_enable_huffman_code(true);
|
||||
|
|
|
@ -29,7 +29,6 @@
|
|||
#include "schema/inner/model_generated.h"
|
||||
#include "securec/include/securec.h"
|
||||
#include "src/common/log_adapter.h"
|
||||
#include "src/param_value_lite.h"
|
||||
|
||||
namespace mindspore {
|
||||
namespace lite {
|
||||
|
@ -58,7 +57,7 @@ class HuffmanEncode {
|
|||
|
||||
~HuffmanEncode();
|
||||
|
||||
STATUS DoHuffmanEncode(const ParamValueLitePtr &weight, const PrimitivePtr &primitive, void *quant_datas,
|
||||
STATUS DoHuffmanEncode(const tensor::TensorPtr &weight, const PrimitivePtr &primitive, void *quant_datas,
|
||||
const size_t &bit_num);
|
||||
|
||||
private:
|
||||
|
|
|
@ -565,8 +565,8 @@ STATUS PostTrainingQuantizer::DoWeightQuant(const std::string &op_name, const An
|
|||
MS_LOG(ERROR) << weight->fullname_with_scope() << " can not cast to Parameter";
|
||||
return RET_NULL_PTR;
|
||||
}
|
||||
ParamValueLitePtr paramValue = std::dynamic_pointer_cast<ParamValueLite>(parameter->default_param());
|
||||
if (paramValue == nullptr) {
|
||||
tensor::TensorPtr tensor_info = std::dynamic_pointer_cast<tensor::Tensor>(parameter->default_param());
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << weight->fullname_with_scope() << " can not get value";
|
||||
return RET_NULL_PTR;
|
||||
}
|
||||
|
@ -583,8 +583,8 @@ STATUS PostTrainingQuantizer::DoWeightQuant(const std::string &op_name, const An
|
|||
quant_min_t = -(1 << (unsigned int)(bit_num_t - 1));
|
||||
}
|
||||
}
|
||||
auto status =
|
||||
QuantFilter<int8_t>(paramValue, primitive, QuantType_PostTraining, quant_max_t, quant_min_t, bit_num_t, perchanel);
|
||||
auto status = QuantFilter<int8_t>(tensor_info, primitive, QuantType_PostTraining, quant_max_t, quant_min_t, bit_num_t,
|
||||
perchanel, kNumberTypeInt8);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "QuantFilter failed: " << status;
|
||||
return status;
|
||||
|
@ -616,8 +616,8 @@ STATUS PostTrainingQuantizer::DoBiasQuant(const AnfNodePtr &bias, const Primitiv
|
|||
auto bias_parameter_ptr = std::dynamic_pointer_cast<Parameter>(bias);
|
||||
MS_ASSERT(bias_parameter_ptr != nullptr);
|
||||
auto bias_default_param = bias_parameter_ptr->default_param();
|
||||
auto bias_param = std::dynamic_pointer_cast<ParamValueLite>(bias_default_param);
|
||||
MS_ASSERT(bias_parameter_ptr != nullptr);
|
||||
auto bias_param = std::dynamic_pointer_cast<tensor::Tensor>(bias_default_param);
|
||||
MS_ASSERT(bias_parameter != nullptr);
|
||||
auto quant_param_holder = GetCNodeQuantHolder(primitive);
|
||||
MS_ASSERT(quant_param_holder != nullptr);
|
||||
auto active_weight_quant_params = quant_param_holder->input_quant_params();
|
||||
|
@ -653,7 +653,7 @@ STATUS PostTrainingQuantizer::DoBiasQuant(const AnfNodePtr &bias, const Primitiv
|
|||
bias_scales.push_back(scaleX * scaleY);
|
||||
}
|
||||
MS_ASSERT(!bias_scales.empty());
|
||||
size_t shape_size = bias_param->tensor_shape_size();
|
||||
size_t shape_size = bias_param->DataSize();
|
||||
|
||||
// set bias quant param
|
||||
std::vector<schema::QuantParamT> quant_params;
|
||||
|
@ -667,17 +667,16 @@ STATUS PostTrainingQuantizer::DoBiasQuant(const AnfNodePtr &bias, const Primitiv
|
|||
// quant bias data
|
||||
std::vector<int32_t> quant_datas(shape_size);
|
||||
|
||||
auto *raw_datas = static_cast<float *>(bias_param->tensor_addr());
|
||||
auto *raw_datas = static_cast<float *>(bias_param->data_c());
|
||||
if (ComputeBiasDataAndQuantParam(bias_scales, input_scales, raw_datas, quant_param_holder, &quant_params,
|
||||
&quant_datas) != RET_OK) {
|
||||
MS_LOG(ERROR) << "compute bias data failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
quant_param_holder->AddInputQuantParam(quant_params);
|
||||
auto ret =
|
||||
memcpy_s(bias_param->tensor_addr(), bias_param->tensor_size(), quant_datas.data(), shape_size * sizeof(int32_t));
|
||||
if (ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s failed.";
|
||||
auto ret = SetTensorData(bias_param, quant_datas.data(), shape_size * sizeof(int32_t));
|
||||
if (ret != RET_OK) {
|
||||
MS_LOG(ERROR) << "set tensor data failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
// set dtype
|
||||
|
@ -1133,11 +1132,11 @@ STATUS PostTrainingQuantizer::BiasCorrection(const FuncGraphPtr &func_graph, con
|
|||
auto bias = cnode->input(3);
|
||||
auto bias_parameter_ptr = std::dynamic_pointer_cast<Parameter>(bias);
|
||||
auto bias_default_param = bias_parameter_ptr->default_param();
|
||||
auto bias_param = std::dynamic_pointer_cast<ParamValueLite>(bias_default_param);
|
||||
int *bias_datas = static_cast<int *>(bias_param->tensor_addr());
|
||||
auto bias_param = std::dynamic_pointer_cast<tensor::Tensor>(bias_default_param);
|
||||
int *bias_datas = static_cast<int *>(bias_param->data_c());
|
||||
|
||||
if (static_cast<size_t>(bias_param->tensor_shape_size()) != bias_diff.size()) {
|
||||
MS_LOG(DEBUG) << "unexpected bias data count: " << bias_param->tensor_shape_size()
|
||||
if (static_cast<size_t>(bias_param->DataSize()) != bias_diff.size()) {
|
||||
MS_LOG(DEBUG) << "unexpected bias data count: " << bias_param->DataSize()
|
||||
<< " not the same as bias_diff: " << bias_diff.size();
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
@ -1146,7 +1145,7 @@ STATUS PostTrainingQuantizer::BiasCorrection(const FuncGraphPtr &func_graph, con
|
|||
<< " not the same as bias_diff: " << bias_diff.size();
|
||||
return RET_ERROR;
|
||||
}
|
||||
for (int i = 0; i < bias_param->tensor_shape_size(); i++) {
|
||||
for (int i = 0; i < bias_param->DataSize(); i++) {
|
||||
auto scale = bias_quant_params[i].scale;
|
||||
if (fabs(scale) <= 0.0f) {
|
||||
MS_LOG(ERROR) << "divisor 'scale' cannot be 0.";
|
||||
|
@ -1177,36 +1176,20 @@ STATUS PostTrainingQuantizer::BiasCorrection(const FuncGraphPtr &func_graph, con
|
|||
}
|
||||
ShapeVector shape;
|
||||
shape.push_back(bias_diff.size());
|
||||
auto type_ptr = TypeIdToType(kNumberTypeFloat32);
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape);
|
||||
parameter->set_abstract(abstract_tensor);
|
||||
parameter->set_name("added_" + op_name + "_bias");
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
std::vector<int32_t> shape_vector;
|
||||
(void)std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int64_t &value) { return static_cast<int32_t>(value); });
|
||||
param_value->set_tensor_shape(shape_vector);
|
||||
param_value->set_tensor_type(kNumberTypeFloat32);
|
||||
|
||||
auto size = sizeof(float) * bias_diff.size();
|
||||
char *tensor_data = new (std::nothrow) char[size];
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new char[] failed";
|
||||
return RET_MEMORY_FAILED;
|
||||
}
|
||||
STATUS status = memcpy_s(tensor_data, size * sizeof(char), bias_diff.data(), size * sizeof(char));
|
||||
if (status != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s error: " << status;
|
||||
delete[] tensor_data;
|
||||
auto tensor_info = CreateTensorInfo(bias_diff.data(), sizeof(float) * bias_diff.size(), shape, kNumberTypeFloat32);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
param_value->SetTensorData(tensor_data, size);
|
||||
parameter->set_default_param(param_value);
|
||||
auto status = InitParameterFromTensorInfo(parameter, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
parameter->set_name("added_" + op_name + "_bias");
|
||||
cnode->add_input(parameter);
|
||||
DoBiasQuant(parameter, primitive);
|
||||
delete[] tensor_data;
|
||||
} else {
|
||||
MS_LOG(ERROR) << "unexpected input_quant_params size: " << input_quant_params.size();
|
||||
}
|
||||
|
|
|
@ -45,6 +45,7 @@
|
|||
#include "tools/anf_exporter/anf_exporter.h"
|
||||
#include "tools/converter/quantizer/bitpacking.h"
|
||||
#include "src/common/utils.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "abstract/abstract_value.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
||||
|
@ -861,49 +862,39 @@ FuncGraphPtr CopyFuncGraph(const FuncGraphPtr &func_graph) {
|
|||
}
|
||||
auto old_cnode = old_cnode_iter->second;
|
||||
auto inputs = cnode->inputs();
|
||||
for (size_t i = 0; i < inputs.size(); i++) {
|
||||
auto input_node = inputs[i];
|
||||
for (const auto &input_node : inputs) {
|
||||
if (input_node->isa<Parameter>()) {
|
||||
auto param_node = input_node->cast<ParameterPtr>();
|
||||
if (param_node->has_default()) {
|
||||
ParamValueLitePtr old_param_value = std::static_pointer_cast<ParamValueLite>(param_node->default_param());
|
||||
auto new_param_value = std::make_shared<ParamValueLite>();
|
||||
|
||||
auto copyed_data = malloc(old_param_value->tensor_size());
|
||||
if (copyed_data == nullptr) {
|
||||
MS_LOG(ERROR) << "malloc data error, size: " << old_param_value->tensor_size();
|
||||
return nullptr;
|
||||
}
|
||||
memcpy(copyed_data, old_param_value->tensor_addr(), old_param_value->tensor_size());
|
||||
|
||||
new_param_value->set_tensor_size(old_param_value->tensor_size());
|
||||
new_param_value->set_tensor_addr(copyed_data);
|
||||
new_param_value->set_tensor_shape(old_param_value->tensor_shape());
|
||||
new_param_value->set_format(old_param_value->format());
|
||||
new_param_value->set_tensor_type(old_param_value->tensor_type());
|
||||
|
||||
param_node->set_default_param(new_param_value);
|
||||
}
|
||||
|
||||
auto old_abstract_base = param_node->abstract();
|
||||
if (!utils::isa<abstract::AbstractTensorPtr>(old_abstract_base)) {
|
||||
MS_LOG(ERROR) << "Abstract of parameter should be abstract tensor, " << param_node->name();
|
||||
if (!param_node->has_default()) {
|
||||
MS_LOG(ERROR) << "Param node has no default parameter: " << cnode_name;
|
||||
return nullptr;
|
||||
}
|
||||
auto old_tensor_info = std::static_pointer_cast<tensor::Tensor>(param_node->default_param());
|
||||
if (old_tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Default param of param node is not a tensor info:" << cnode_name;
|
||||
return nullptr;
|
||||
}
|
||||
auto new_tensor_info = lite::CreateTensorInfo(old_tensor_info->data().data(), old_tensor_info->data().nbytes(),
|
||||
old_tensor_info->shape(), old_tensor_info->data_type());
|
||||
if (new_tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Create tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
auto status = lite::InitParameterFromTensorInfo(param_node, new_tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
auto old_abstract = utils::cast<abstract::AbstractTensorPtr>(old_abstract_base);
|
||||
auto new_abstract = std::make_shared<abstract::AbstractTensor>(old_abstract->element()->GetTypeTrack(),
|
||||
old_abstract->GetShapeTrack());
|
||||
param_node->set_abstract(new_abstract);
|
||||
}
|
||||
} // end inputs loop
|
||||
} // end cnodes loop
|
||||
return new_func_graph;
|
||||
}
|
||||
|
||||
void GetLiteParameter(const AnfNodePtr &node, ParameterPtr *param_node, ParamValueLitePtr *param_value) {
|
||||
void GetLiteParameter(const AnfNodePtr &node, ParameterPtr *param_node, tensor::TensorPtr *tensor_info) {
|
||||
MS_ASSERT(node != nullptr);
|
||||
MS_ASSERT(param_node != nullptr);
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
MS_ASSERT(tensor_info != nullptr);
|
||||
|
||||
auto op_name = node->fullname_with_scope();
|
||||
|
||||
|
@ -917,26 +908,22 @@ void GetLiteParameter(const AnfNodePtr &node, ParameterPtr *param_node, ParamVal
|
|||
return;
|
||||
}
|
||||
|
||||
*param_value = std::static_pointer_cast<ParamValueLite>((*param_node)->default_param());
|
||||
if (*param_value == nullptr) {
|
||||
MS_LOG(INFO) << "default_param can not cast to ParamValueLite";
|
||||
*tensor_info = std::static_pointer_cast<tensor::Tensor>((*param_node)->default_param());
|
||||
if (*tensor_info == nullptr) {
|
||||
MS_LOG(INFO) << "default_param can not cast to tensor::Tensor";
|
||||
return;
|
||||
}
|
||||
}
|
||||
|
||||
STATUS UpdateTensorDataAndSize(ParamValueLitePtr weight, void *quant_datas, int new_size) {
|
||||
STATUS UpdateTensorDataAndSize(const tensor::TensorPtr &weight, void *quant_datas, int new_size, TypeId new_data_type) {
|
||||
MS_ASSERT(weight != nullptr);
|
||||
MS_ASSERT(new_size > 0);
|
||||
delete[] reinterpret_cast<char *>(weight->tensor_addr());
|
||||
char *new_tensor_data = new (std::nothrow) char[new_size];
|
||||
if (new_tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new data error";
|
||||
weight->set_data_type(new_data_type);
|
||||
if (new_size != weight->data().nbytes()) {
|
||||
MS_LOG(ERROR) << "Data size of tensor info is error.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
memcpy(new_tensor_data, quant_datas, new_size);
|
||||
|
||||
weight->set_tensor_size(new_size);
|
||||
weight->set_tensor_addr(new_tensor_data);
|
||||
memcpy(weight->data_c(), quant_datas, new_size);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
|
|
|
@ -108,7 +108,7 @@ std::pair<float, float> OutlierMethod(std::vector<float> min_datas, std::vector<
|
|||
|
||||
std::vector<int8_t> KMeans(float *data, size_t elem_count, size_t k, size_t epochs, schema::QuantParamT *quantParam);
|
||||
|
||||
STATUS UpdateTensorDataAndSize(ParamValueLitePtr weight, void *quant_datas, int new_size);
|
||||
STATUS UpdateTensorDataAndSize(const tensor::TensorPtr &weight, void *quant_datas, int new_size, TypeId new_data_type);
|
||||
|
||||
void GetMaxMinPerchannel(int channels, int one_filter_size, int i, int elem_count, const float *raw_datas,
|
||||
bool channel_at_first, float *desired_max, float *desired_min);
|
||||
|
@ -166,13 +166,13 @@ T QuantizeData(float originData, const schema::QuantParamT &quantParam, int quan
|
|||
}
|
||||
|
||||
template <typename T>
|
||||
STATUS DoPerChannelQuant(const ParamValueLitePtr &weight, const QuantType &quant_type,
|
||||
STATUS DoPerChannelQuant(const tensor::TensorPtr &weight, const QuantType &quant_type,
|
||||
std::vector<schema::QuantParamT> *quant_params, const int &quant_max, const int &quant_min,
|
||||
const size_t &bit_num, const bool &k_means, std::vector<T> *quant_datas,
|
||||
std::vector<float> *dequant_datas, bool channel_at_first = true) {
|
||||
auto dims = weight->tensor_shape();
|
||||
size_t elem_count = weight->tensor_shape_size();
|
||||
auto *raw_datas = static_cast<float *>(weight->tensor_addr());
|
||||
std::vector<float> *dequant_datas, TypeId quant_data_type, bool channel_at_first = true) {
|
||||
auto dims = weight->shape();
|
||||
size_t elem_count = weight->DataSize();
|
||||
auto *raw_datas = static_cast<float *>(weight->data_c());
|
||||
auto channels = dims[0];
|
||||
if (!channel_at_first) {
|
||||
if (dims.size() != 2) {
|
||||
|
@ -253,7 +253,7 @@ STATUS DoPerChannelQuant(const ParamValueLitePtr &weight, const QuantType &quant
|
|||
}
|
||||
quant_params->emplace_back(quant_param);
|
||||
}
|
||||
auto status = UpdateTensorDataAndSize(weight, quant_datas->data(), quant_datas->size() * sizeof(T));
|
||||
auto status = UpdateTensorDataAndSize(weight, quant_datas->data(), quant_datas->size() * sizeof(T), quant_data_type);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "UpdateTensorDataAndSize error";
|
||||
return RET_ERROR;
|
||||
|
@ -262,12 +262,13 @@ STATUS DoPerChannelQuant(const ParamValueLitePtr &weight, const QuantType &quant
|
|||
}
|
||||
|
||||
template <typename T>
|
||||
STATUS DoPerLayerQuant(const ParamValueLitePtr &weight, const QuantType &quant_type,
|
||||
STATUS DoPerLayerQuant(const tensor::TensorPtr &weight, const QuantType &quant_type,
|
||||
std::vector<schema::QuantParamT> *quant_params, const int &quant_max, const int &quant_min,
|
||||
const size_t &bit_num, const bool &k_means, std::vector<T> *quant_datas) {
|
||||
auto dims = weight->tensor_shape();
|
||||
size_t elem_count = weight->tensor_shape_size();
|
||||
auto *raw_datas = static_cast<float *>(weight->tensor_addr());
|
||||
const size_t &bit_num, const bool &k_means, std::vector<T> *quant_datas,
|
||||
TypeId quant_data_type) {
|
||||
auto dims = weight->shape();
|
||||
size_t elem_count = weight->DataSize();
|
||||
auto *raw_datas = static_cast<float *>(weight->data_c());
|
||||
float min = FLT_MAX;
|
||||
float max = -FLT_MIN;
|
||||
for (uint32_t i = 0; i < elem_count; i++) {
|
||||
|
@ -293,7 +294,7 @@ STATUS DoPerLayerQuant(const ParamValueLitePtr &weight, const QuantType &quant_t
|
|||
(*quant_datas)[i] = quant_data;
|
||||
}
|
||||
}
|
||||
auto status = UpdateTensorDataAndSize(weight, quant_datas->data(), quant_datas->size() * sizeof(T));
|
||||
auto status = UpdateTensorDataAndSize(weight, quant_datas->data(), quant_datas->size() * sizeof(T), quant_data_type);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "UpdateTensorDataAndSize error";
|
||||
return RET_ERROR;
|
||||
|
@ -301,7 +302,7 @@ STATUS DoPerLayerQuant(const ParamValueLitePtr &weight, const QuantType &quant_t
|
|||
return RET_OK;
|
||||
}
|
||||
template <typename T>
|
||||
STATUS DoBitPack(const ParamValueLitePtr &weight, const size_t &bit_num, const std::vector<T> &quant_datas) {
|
||||
STATUS DoBitPack(const tensor::TensorPtr &weight, const size_t &bit_num, const std::vector<T> &quant_datas) {
|
||||
if (bit_num != 8 && bit_num != 16) {
|
||||
std::vector<T> data{};
|
||||
for (size_t i = 0; i < quant_datas.size(); ++i) {
|
||||
|
@ -310,7 +311,8 @@ STATUS DoBitPack(const ParamValueLitePtr &weight, const size_t &bit_num, const s
|
|||
if (bit_num > 0 && bit_num < 8) {
|
||||
std::vector<uint8_t> pack_data{};
|
||||
BitPack::BitPacking<T, uint8_t>(bit_num, data, &pack_data);
|
||||
auto status = UpdateTensorDataAndSize(weight, pack_data.data(), pack_data.size() * sizeof(uint8_t));
|
||||
auto status =
|
||||
UpdateTensorDataAndSize(weight, pack_data.data(), pack_data.size() * sizeof(uint8_t), kNumberTypeUInt8);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "UpdateTensorDataAndSize error";
|
||||
return RET_ERROR;
|
||||
|
@ -318,7 +320,8 @@ STATUS DoBitPack(const ParamValueLitePtr &weight, const size_t &bit_num, const s
|
|||
} else if (bit_num > 8 && bit_num < 16) {
|
||||
std::vector<uint16_t> pack_data{};
|
||||
BitPack::BitPacking<T, uint16_t>(bit_num, data, &pack_data);
|
||||
auto status = UpdateTensorDataAndSize(weight, pack_data.data(), pack_data.size() * sizeof(uint16_t));
|
||||
auto status =
|
||||
UpdateTensorDataAndSize(weight, pack_data.data(), pack_data.size() * sizeof(uint16_t), kNumberTypeUInt16);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "UpdateTensorDataAndSize error";
|
||||
return RET_ERROR;
|
||||
|
@ -329,11 +332,12 @@ STATUS DoBitPack(const ParamValueLitePtr &weight, const size_t &bit_num, const s
|
|||
}
|
||||
|
||||
template <typename T>
|
||||
STATUS QuantFilter(const ParamValueLitePtr &weight, const PrimitivePtr &primitive, QuantType quant_type, int quant_max,
|
||||
int quant_min, size_t bit_num, bool per_channel, int index = 1, bool k_means = false) {
|
||||
STATUS QuantFilter(const tensor::TensorPtr &weight, const PrimitivePtr &primitive, QuantType quant_type, int quant_max,
|
||||
int quant_min, size_t bit_num, bool per_channel, TypeId quant_data_type, int index = 1,
|
||||
bool k_means = false) {
|
||||
MS_ASSERT(weight != nullptr);
|
||||
MS_ASSERT(primitive != nullptr);
|
||||
auto dims = weight->tensor_shape();
|
||||
auto dims = weight->shape();
|
||||
if (per_channel) {
|
||||
if (dims.size() <= 1) {
|
||||
MS_LOG(WARNING) << "dims is " << dims.size() << " can not per_channel";
|
||||
|
@ -342,8 +346,8 @@ STATUS QuantFilter(const ParamValueLitePtr &weight, const PrimitivePtr &primitiv
|
|||
}
|
||||
|
||||
std::vector<schema::QuantParamT> quant_params;
|
||||
size_t elem_count = weight->tensor_shape_size();
|
||||
auto *raw_data = static_cast<float *>(weight->tensor_addr());
|
||||
size_t elem_count = weight->DataSize();
|
||||
auto *raw_data = static_cast<float *>(weight->data_c());
|
||||
if (raw_data == nullptr) {
|
||||
MS_LOG(ERROR) << "rawDatas is nullptr";
|
||||
return RET_ERROR;
|
||||
|
@ -354,7 +358,7 @@ STATUS QuantFilter(const ParamValueLitePtr &weight, const PrimitivePtr &primitiv
|
|||
int ret = RET_OK;
|
||||
if (per_channel) {
|
||||
bool channel_at_first = true;
|
||||
if (primitive->name() == ops::kNameMatMul && weight->tensor_shape().size() == 2) {
|
||||
if (primitive->name() == ops::kNameMatMul && weight->shape().size() == 2) {
|
||||
auto matmul_prim = primitive->cast<std::shared_ptr<ops::MatMul>>();
|
||||
MS_ASSERT(matmul_prim != nullptr);
|
||||
channel_at_first =
|
||||
|
@ -362,7 +366,7 @@ STATUS QuantFilter(const ParamValueLitePtr &weight, const PrimitivePtr &primitiv
|
|||
}
|
||||
// channel at first
|
||||
ret = DoPerChannelQuant<T>(weight, quant_type, &quant_params, quant_max, quant_min, bit_num, k_means, &quant_data,
|
||||
&dequant_datas, channel_at_first);
|
||||
&dequant_datas, quant_data_type, channel_at_first);
|
||||
if (ret == RET_CONTINUE) {
|
||||
return ret;
|
||||
} else if (ret != RET_OK) {
|
||||
|
@ -370,7 +374,8 @@ STATUS QuantFilter(const ParamValueLitePtr &weight, const PrimitivePtr &primitiv
|
|||
return ret;
|
||||
}
|
||||
} else {
|
||||
ret = DoPerLayerQuant<T>(weight, quant_type, &quant_params, quant_max, quant_min, bit_num, k_means, &quant_data);
|
||||
ret = DoPerLayerQuant<T>(weight, quant_type, &quant_params, quant_max, quant_min, bit_num, k_means, &quant_data,
|
||||
quant_data_type);
|
||||
if (ret != RET_OK) {
|
||||
MS_LOG(ERROR) << "Do per layer quant failed.";
|
||||
return ret;
|
||||
|
@ -422,6 +427,6 @@ STATUS CopyInputDataToTensor(size_t input_index, size_t image_index,
|
|||
|
||||
FuncGraphPtr CopyFuncGraph(const FuncGraphPtr &);
|
||||
|
||||
void GetLiteParameter(const AnfNodePtr &node, ParameterPtr *param_node, ParamValueLitePtr *param_value);
|
||||
void GetLiteParameter(const AnfNodePtr &node, ParameterPtr *param_node, tensor::TensorPtr *tensor_info);
|
||||
} // namespace mindspore::lite::quant
|
||||
#endif
|
||||
|
|
|
@ -25,7 +25,6 @@
|
|||
#include "ir/func_graph.h"
|
||||
#include "ir/anf.h"
|
||||
#include "base/base.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "tools/converter/quant_param_holder.h"
|
||||
|
||||
|
|
|
@ -57,10 +57,10 @@ WeightQuantizer::~WeightQuantizer() {
|
|||
}
|
||||
}
|
||||
|
||||
STATUS WeightQuantizer::SetAbstract(ParamValueLitePtr param_value, ParameterPtr param_node,
|
||||
STATUS WeightQuantizer::SetAbstract(const tensor::TensorPtr &tensor_info, const ParameterPtr ¶m_node,
|
||||
const PrimitivePtr &primitive) {
|
||||
// set dtype
|
||||
param_value->set_tensor_type(type_id_);
|
||||
tensor_info->set_data_type(type_id_);
|
||||
auto abstract_base = param_node->abstract();
|
||||
if (abstract_base == nullptr) {
|
||||
MS_LOG(ERROR) << "Abstract of parameter is nullptr, " << param_node->name();
|
||||
|
@ -78,7 +78,7 @@ STATUS WeightQuantizer::SetAbstract(ParamValueLitePtr param_value, ParameterPtr
|
|||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS WeightQuantizer::DoConvQuantize(CNodePtr cnode) {
|
||||
STATUS WeightQuantizer::DoConvQuantize(const CNodePtr &cnode) {
|
||||
auto primitive = GetValueNode<PrimitivePtr>(cnode->input(0));
|
||||
if (primitive == nullptr) {
|
||||
MS_LOG(ERROR) << "primitive is nullptr";
|
||||
|
@ -91,24 +91,25 @@ STATUS WeightQuantizer::DoConvQuantize(CNodePtr cnode) {
|
|||
}
|
||||
|
||||
ParameterPtr param_node;
|
||||
ParamValueLitePtr param_value;
|
||||
tensor::TensorPtr tensor_info;
|
||||
|
||||
GetLiteParameter(input_node, ¶m_node, ¶m_value);
|
||||
if (param_node == nullptr || param_value == nullptr) {
|
||||
GetLiteParameter(input_node, ¶m_node, &tensor_info);
|
||||
if (param_node == nullptr || tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "GetLiteParameter error";
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
if (param_value->tensor_type() != mindspore::kNumberTypeFloat32) {
|
||||
MS_LOG(ERROR) << "model weight data type invalid which is " << param_value->tensor_type();
|
||||
if (tensor_info->data_type() != mindspore::kNumberTypeFloat32) {
|
||||
MS_LOG(ERROR) << "model weight data type invalid which is " << tensor_info->data_type();
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto status = RET_ERROR;
|
||||
if (type_id_ == kNumberTypeInt8) {
|
||||
status = QuantFilter<int8_t>(param_value, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, true);
|
||||
status = QuantFilter<int8_t>(tensor_info, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, true,
|
||||
type_id_);
|
||||
} else if (type_id_ == kNumberTypeInt16) {
|
||||
status =
|
||||
QuantFilter<int16_t>(param_value, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, true);
|
||||
status = QuantFilter<int16_t>(tensor_info, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, true,
|
||||
type_id_);
|
||||
}
|
||||
if (status == RET_CONTINUE) {
|
||||
return RET_OK;
|
||||
|
@ -116,7 +117,7 @@ STATUS WeightQuantizer::DoConvQuantize(CNodePtr cnode) {
|
|||
MS_LOG(ERROR) << "QuantFilter failed : " << status;
|
||||
return status;
|
||||
}
|
||||
status = SetAbstract(param_value, param_node, primitive);
|
||||
status = SetAbstract(tensor_info, param_node, primitive);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "SetAbstract failed : " << status;
|
||||
return RET_ERROR;
|
||||
|
@ -124,9 +125,9 @@ STATUS WeightQuantizer::DoConvQuantize(CNodePtr cnode) {
|
|||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS WeightQuantizer::DoMulQuantize(CNodePtr cnode) {
|
||||
STATUS WeightQuantizer::DoMulQuantize(const CNodePtr &cnode) {
|
||||
auto already_quant = false;
|
||||
ParamValueLitePtr param_value = nullptr;
|
||||
tensor::TensorPtr tensor_info = nullptr;
|
||||
ParameterPtr param_node = nullptr;
|
||||
int index = 0;
|
||||
for (size_t i = 1; i < cnode->size(); i++) {
|
||||
|
@ -134,18 +135,18 @@ STATUS WeightQuantizer::DoMulQuantize(CNodePtr cnode) {
|
|||
if (inputNode->isa<Parameter>()) {
|
||||
param_node = inputNode->cast<ParameterPtr>();
|
||||
if ((param_node != nullptr) && param_node->has_default()) {
|
||||
param_value = std::static_pointer_cast<ParamValueLite>(param_node->default_param());
|
||||
if ((param_value == nullptr) || (param_value->tensor_size() == 0) || (param_value->tensor_addr() == nullptr)) {
|
||||
param_value = nullptr;
|
||||
tensor_info = std::static_pointer_cast<tensor::Tensor>(param_node->default_param());
|
||||
if ((tensor_info == nullptr) || (tensor_info->Size() == 0) || (tensor_info->data_c() == nullptr)) {
|
||||
tensor_info = nullptr;
|
||||
continue;
|
||||
} else if (param_value->tensor_type() == mindspore::kNumberTypeInt8 ||
|
||||
param_value->tensor_type() == mindspore::kNumberTypeInt16) {
|
||||
} else if (tensor_info->data_type() == mindspore::kNumberTypeInt8 ||
|
||||
tensor_info->data_type() == mindspore::kNumberTypeInt16) {
|
||||
MS_LOG(INFO) << "the node: " << cnode->fullname_with_scope() << " input_i: " << i << "has been "
|
||||
<< " quantized";
|
||||
already_quant = true;
|
||||
break;
|
||||
} else if (param_value->tensor_type() != mindspore::kNumberTypeFloat32) {
|
||||
param_value = nullptr;
|
||||
} else if (tensor_info->data_type() != mindspore::kNumberTypeFloat32) {
|
||||
tensor_info = nullptr;
|
||||
continue;
|
||||
} else {
|
||||
index = i;
|
||||
|
@ -159,7 +160,7 @@ STATUS WeightQuantizer::DoMulQuantize(CNodePtr cnode) {
|
|||
return RET_OK;
|
||||
}
|
||||
|
||||
if (param_value == nullptr) {
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(WARNING) << cnode->fullname_with_scope() << " No valid input param node !";
|
||||
return RET_OK;
|
||||
}
|
||||
|
@ -172,11 +173,11 @@ STATUS WeightQuantizer::DoMulQuantize(CNodePtr cnode) {
|
|||
|
||||
auto status = RET_ERROR;
|
||||
if (type_id_ == kNumberTypeInt8) {
|
||||
status = QuantFilter<int8_t>(param_value, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, true,
|
||||
index - 1);
|
||||
status = QuantFilter<int8_t>(tensor_info, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, true,
|
||||
type_id_, index - 1);
|
||||
} else if (type_id_ == kNumberTypeInt16) {
|
||||
status = QuantFilter<int16_t>(param_value, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, true,
|
||||
index - 1);
|
||||
status = QuantFilter<int16_t>(tensor_info, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, true,
|
||||
type_id_, index - 1);
|
||||
}
|
||||
if (status == RET_CONTINUE) {
|
||||
return RET_OK;
|
||||
|
@ -184,7 +185,7 @@ STATUS WeightQuantizer::DoMulQuantize(CNodePtr cnode) {
|
|||
MS_LOG(ERROR) << "QuantFilter failed : " << status;
|
||||
return status;
|
||||
}
|
||||
status = SetAbstract(param_value, param_node, primitive);
|
||||
status = SetAbstract(tensor_info, param_node, primitive);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "SetAbstract failed : " << status;
|
||||
return RET_ERROR;
|
||||
|
@ -193,7 +194,7 @@ STATUS WeightQuantizer::DoMulQuantize(CNodePtr cnode) {
|
|||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS WeightQuantizer::DoLstmQuantize(CNodePtr cnode) {
|
||||
STATUS WeightQuantizer::DoLstmQuantize(const CNodePtr &cnode) {
|
||||
MS_ASSERT(cnode != nullptr);
|
||||
auto op_name = cnode->fullname_with_scope();
|
||||
|
||||
|
@ -226,32 +227,32 @@ STATUS WeightQuantizer::DoLstmQuantize(CNodePtr cnode) {
|
|||
return status;
|
||||
}
|
||||
|
||||
STATUS WeightQuantizer::DoGatherQuantize(CNodePtr cnode) {
|
||||
STATUS WeightQuantizer::DoGatherQuantize(const CNodePtr &cnode) {
|
||||
auto primitive = GetValueNode<PrimitivePtr>(cnode->input(0));
|
||||
MS_ASSERT(primitive != nullptr);
|
||||
|
||||
auto first_input = cnode->input(1);
|
||||
ParameterPtr param_node;
|
||||
ParamValueLitePtr param_value;
|
||||
GetLiteParameter(first_input, ¶m_node, ¶m_value);
|
||||
if (param_node == nullptr || param_value == nullptr || param_value->tensor_type() != TypeId::kNumberTypeFloat32) {
|
||||
tensor::TensorPtr tensor_info;
|
||||
GetLiteParameter(first_input, ¶m_node, &tensor_info);
|
||||
if (param_node == nullptr || tensor_info == nullptr || tensor_info->data_type() != TypeId::kNumberTypeFloat32) {
|
||||
MS_LOG(INFO) << "This Gather op " << cnode->fullname_with_scope() << " can not quant weight";
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
if (param_value->tensor_size() / 4 < quant_strategy_->m_weight_size_) {
|
||||
MS_LOG(INFO) << cnode->fullname_with_scope() << " param cnt: " << param_value->tensor_size() / 4 << " < "
|
||||
if (tensor_info->Size() / 4 < quant_strategy_->m_weight_size_) {
|
||||
MS_LOG(INFO) << cnode->fullname_with_scope() << " param cnt: " << tensor_info->Size() / 4 << " < "
|
||||
<< quant_strategy_->m_weight_size_;
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
auto status = RET_ERROR;
|
||||
if (type_id_ == kNumberTypeInt8) {
|
||||
status =
|
||||
QuantFilter<int8_t>(param_value, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, false, 0);
|
||||
status = QuantFilter<int8_t>(tensor_info, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, false,
|
||||
type_id_, 0);
|
||||
} else if (type_id_ == kNumberTypeInt16) {
|
||||
status =
|
||||
QuantFilter<int16_t>(param_value, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, false, 0);
|
||||
status = QuantFilter<int16_t>(tensor_info, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_,
|
||||
false, type_id_, 0);
|
||||
}
|
||||
if (status == RET_CONTINUE) {
|
||||
return RET_OK;
|
||||
|
@ -259,7 +260,7 @@ STATUS WeightQuantizer::DoGatherQuantize(CNodePtr cnode) {
|
|||
MS_LOG(ERROR) << "QuantFilter failed : " << status;
|
||||
return status;
|
||||
}
|
||||
status = SetAbstract(param_value, param_node, primitive);
|
||||
status = SetAbstract(tensor_info, param_node, primitive);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "SetAbstract failed : " << status;
|
||||
return RET_ERROR;
|
||||
|
@ -272,28 +273,28 @@ STATUS WeightQuantizer::ProcessLstmWeightByIndex(const CNodePtr &cnode, const Pr
|
|||
auto op_name = cnode->fullname_with_scope();
|
||||
auto weight_i = cnode->input(index);
|
||||
ParameterPtr param_node;
|
||||
ParamValueLitePtr param_value;
|
||||
GetLiteParameter(weight_i, ¶m_node, ¶m_value);
|
||||
if (param_node == nullptr || param_value == nullptr) {
|
||||
|
||||
tensor::TensorPtr tensor_info;
|
||||
GetLiteParameter(weight_i, ¶m_node, &tensor_info);
|
||||
if (param_node == nullptr || tensor_info == nullptr) {
|
||||
MS_LOG(INFO) << "LSTM input index " << index << " is not weight";
|
||||
return RET_OK;
|
||||
}
|
||||
if (param_value->tensor_type() != TypeId::kNumberTypeFloat32) {
|
||||
MS_LOG(WARNING) << "param_value tensor type is: " << param_value->tensor_type() << " not quant";
|
||||
if (tensor_info->data_type() != TypeId::kNumberTypeFloat32) {
|
||||
MS_LOG(WARNING) << "tensor_info tensor type is: " << tensor_info->data_type() << " not quant";
|
||||
return RET_OK;
|
||||
}
|
||||
if (param_value->tensor_size() / 4 < quant_strategy_->m_weight_size_) {
|
||||
MS_LOG(INFO) << op_name << " weight_i cnt: " << param_value->tensor_size() / 4 << " < "
|
||||
<< quant_strategy_->m_weight_size_;
|
||||
if (tensor_info->Size() / 4 < quant_strategy_->m_weight_size_) {
|
||||
MS_LOG(INFO) << op_name << " weight_i cnt: " << tensor_info->Size() / 4 << " < " << quant_strategy_->m_weight_size_;
|
||||
return RET_OK;
|
||||
}
|
||||
auto status = RET_ERROR;
|
||||
if (type_id_ == kNumberTypeInt8) {
|
||||
status = QuantFilter<int8_t>(param_value, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, false,
|
||||
index - 1);
|
||||
status = QuantFilter<int8_t>(tensor_info, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_, false,
|
||||
type_id_, index - 1);
|
||||
} else if (type_id_ == kNumberTypeInt16) {
|
||||
status = QuantFilter<int16_t>(param_value, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_,
|
||||
false, index - 1);
|
||||
status = QuantFilter<int16_t>(tensor_info, primitive, QuantType_WeightQuant, quant_max_, quant_min_, bit_num_,
|
||||
false, type_id_, index - 1);
|
||||
}
|
||||
if (status == RET_CONTINUE) {
|
||||
return RET_OK;
|
||||
|
@ -301,7 +302,7 @@ STATUS WeightQuantizer::ProcessLstmWeightByIndex(const CNodePtr &cnode, const Pr
|
|||
MS_LOG(ERROR) << "QuantFilter failed : " << status;
|
||||
return status;
|
||||
}
|
||||
status = SetAbstract(param_value, param_node, primitive);
|
||||
status = SetAbstract(tensor_info, param_node, primitive);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "SetAbstract failed : " << status;
|
||||
return RET_ERROR;
|
||||
|
@ -378,7 +379,7 @@ float CompareOutputData(const std::unordered_map<std::string, mindspore::tensor:
|
|||
return total_mean_error / tensor_cnt;
|
||||
}
|
||||
|
||||
STATUS WeightQuantizer::RunFp32Graph(FuncGraphPtr func_graph) {
|
||||
STATUS WeightQuantizer::RunFp32Graph(const FuncGraphPtr &func_graph) {
|
||||
auto image_cnt = images_.at(0).size();
|
||||
if (!config_param_.input_shapes.empty()) {
|
||||
if (config_param_.input_shapes.size() != image_cnt) {
|
||||
|
@ -475,7 +476,7 @@ STATUS WeightQuantizer::CheckImageCnt() {
|
|||
return RET_OK;
|
||||
}
|
||||
STATUS WeightQuantizer::GetParamNodeAndValue(const std::shared_ptr<AnfNode> &input_node, const std::string &op_name,
|
||||
ParameterPtr *param_node, ParamValueLitePtr *param_value) {
|
||||
ParameterPtr *param_node, tensor::TensorPtr *tensor_info) {
|
||||
if (!input_node->isa<Parameter>()) {
|
||||
MS_LOG(WARNING) << op_name << " the second input is not parameter";
|
||||
return RET_CONTINUE;
|
||||
|
@ -485,30 +486,30 @@ STATUS WeightQuantizer::GetParamNodeAndValue(const std::shared_ptr<AnfNode> &inp
|
|||
MS_LOG(WARNING) << op_name << " the second input can not convert to parameter";
|
||||
return RET_CONTINUE;
|
||||
}
|
||||
*param_value = std::static_pointer_cast<ParamValueLite>((*param_node)->default_param());
|
||||
if (*param_value == nullptr) {
|
||||
*tensor_info = std::static_pointer_cast<tensor::Tensor>((*param_node)->default_param());
|
||||
if (*tensor_info == nullptr) {
|
||||
MS_LOG(WARNING) << op_name << " the second input can not convert to parameter";
|
||||
return RET_CONTINUE;
|
||||
}
|
||||
if ((*param_value)->tensor_type() != TypeId::kNumberTypeFloat32) {
|
||||
if ((*tensor_info)->data_type() != TypeId::kNumberTypeFloat32) {
|
||||
MS_LOG(WARNING) << op_name << " the second input type is not float";
|
||||
return RET_CONTINUE;
|
||||
}
|
||||
return RET_OK;
|
||||
}
|
||||
STATUS WeightQuantizer::TryQuant(const int &bit_num_t, const ParameterPtr ¶m_node,
|
||||
const ParamValueLitePtr ¶m_value, const PrimitivePtr &primitive) {
|
||||
const tensor::TensorPtr &tensor_info, const PrimitivePtr &primitive) {
|
||||
int status;
|
||||
type_id_ = TypeId::kNumberTypeInt8;
|
||||
int quant_max_t = (1 << (unsigned int)(bit_num_t - 1)) - 1;
|
||||
int quant_min_t = -(1 << (unsigned int)(bit_num_t - 1));
|
||||
|
||||
if (type_id_ == TypeId::kNumberTypeInt8) {
|
||||
status = QuantFilter<int8_t>(param_value, primitive, QuantType::QuantType_WeightQuant, quant_max_t, quant_min_t,
|
||||
bit_num_t, true);
|
||||
status = QuantFilter<int8_t>(tensor_info, primitive, QuantType::QuantType_WeightQuant, quant_max_t, quant_min_t,
|
||||
bit_num_t, true, type_id_);
|
||||
} else if (type_id_ == TypeId::kNumberTypeInt16) {
|
||||
status = QuantFilter<int16_t>(param_value, primitive, QuantType::QuantType_WeightQuant, quant_max_t, quant_min_t,
|
||||
bit_num_t, true);
|
||||
status = QuantFilter<int16_t>(tensor_info, primitive, QuantType::QuantType_WeightQuant, quant_max_t, quant_min_t,
|
||||
bit_num_t, true, type_id_);
|
||||
} else {
|
||||
MS_LOG(ERROR) << "unexpected type_id_: " << type_id_;
|
||||
return RET_ERROR;
|
||||
|
@ -519,7 +520,7 @@ STATUS WeightQuantizer::TryQuant(const int &bit_num_t, const ParameterPtr ¶m
|
|||
MS_LOG(ERROR) << "quant filter failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
status = SetAbstract(param_value, param_node, primitive);
|
||||
status = SetAbstract(tensor_info, param_node, primitive);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "SetAbstract failed : " << status;
|
||||
return RET_ERROR;
|
||||
|
@ -542,24 +543,24 @@ STATUS WeightQuantizer::DoQuantSearch(const FuncGraphPtr &func_graph) {
|
|||
if (quant_strategy_->CanConvOpQuantized(cnode) || quant_strategy_->CanMulOpQuantized(cnode)) {
|
||||
auto input_node = cnode->input(2);
|
||||
ParameterPtr param_node;
|
||||
ParamValueLitePtr param_value;
|
||||
status = GetParamNodeAndValue(input_node, op_name, ¶m_node, ¶m_value);
|
||||
tensor::TensorPtr tensor_info;
|
||||
status = GetParamNodeAndValue(input_node, op_name, ¶m_node, &tensor_info);
|
||||
if (status == RET_CONTINUE) {
|
||||
continue;
|
||||
}
|
||||
// copy origin data in case to recover
|
||||
auto *raw_data = static_cast<float *>(param_value->tensor_addr());
|
||||
auto elem_count = param_value->tensor_shape_size();
|
||||
auto *raw_data = static_cast<float *>(tensor_info->data_c());
|
||||
auto elem_count = tensor_info->DataSize();
|
||||
std::unique_ptr<float[]> origin_data(new (std::nothrow) float[elem_count]);
|
||||
auto ret = memcpy_s(origin_data.get(), sizeof(float) * elem_count, raw_data, param_value->tensor_size());
|
||||
auto ret = memcpy_s(origin_data.get(), sizeof(float) * elem_count, raw_data, tensor_info->Size());
|
||||
if (ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy fail: "
|
||||
<< " dst size: " << sizeof(float) * elem_count << " src size: " << param_value->tensor_size();
|
||||
<< " dst size: " << sizeof(float) * elem_count << " src size: " << tensor_info->Size();
|
||||
return RET_ERROR;
|
||||
}
|
||||
// 1. try quant
|
||||
for (int bit_num_t = 2; bit_num_t <= 8; bit_num_t++) {
|
||||
status = TryQuant(bit_num_t, param_node, param_value, primitive);
|
||||
status = TryQuant(bit_num_t, param_node, tensor_info, primitive);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "TryQuant failed.";
|
||||
return RET_ERROR;
|
||||
|
@ -616,7 +617,8 @@ STATUS WeightQuantizer::DoQuantSearch(const FuncGraphPtr &func_graph) {
|
|||
MS_LOG(DEBUG) << "op: " << op_name << " intermediate bit: " << bit_num_t << " mean_error: " << mean_error
|
||||
<< " [recover]";
|
||||
// recover
|
||||
status = UpdateTensorDataAndSize(param_value, origin_data.get(), sizeof(float) * elem_count);
|
||||
status =
|
||||
UpdateTensorDataAndSize(tensor_info, origin_data.get(), sizeof(float) * elem_count, kNumberTypeFloat32);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "UpdateTensorDataAndSize fail";
|
||||
return RET_ERROR;
|
||||
|
@ -631,7 +633,7 @@ STATUS WeightQuantizer::DoQuantSearch(const FuncGraphPtr &func_graph) {
|
|||
return status;
|
||||
}
|
||||
|
||||
STATUS WeightQuantizer::DoMixedQuant(FuncGraphPtr func_graph) {
|
||||
STATUS WeightQuantizer::DoMixedQuant(const FuncGraphPtr &func_graph) {
|
||||
// 0.2 Parse input calib files
|
||||
auto status = CollectCalibInputs(config_param_.image_paths, config_param_.batch_count, &images_);
|
||||
if (status != RET_OK) {
|
||||
|
@ -669,7 +671,7 @@ STATUS WeightQuantizer::DoMixedQuant(FuncGraphPtr func_graph) {
|
|||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS WeightQuantizer::DoFixedQuant(FuncGraphPtr func_graph) {
|
||||
STATUS WeightQuantizer::DoFixedQuant(const FuncGraphPtr &func_graph) {
|
||||
MS_ASSERT(func_graph != nullptr);
|
||||
for (auto &cnode : func_graph->GetOrderedCnodes()) {
|
||||
auto primitive = GetValueNode<std::shared_ptr<ops::PrimitiveC>>(cnode->input(0));
|
||||
|
|
|
@ -41,10 +41,10 @@ class WeightQuantizer : public Quantizer {
|
|||
~WeightQuantizer();
|
||||
|
||||
STATUS DoQuantize(FuncGraphPtr func_graph) override;
|
||||
STATUS DoConvQuantize(CNodePtr);
|
||||
STATUS DoMulQuantize(CNodePtr);
|
||||
STATUS DoLstmQuantize(CNodePtr cnode);
|
||||
STATUS DoGatherQuantize(CNodePtr cnode);
|
||||
STATUS DoConvQuantize(const CNodePtr &);
|
||||
STATUS DoMulQuantize(const CNodePtr &);
|
||||
STATUS DoLstmQuantize(const CNodePtr &cnode);
|
||||
STATUS DoGatherQuantize(const CNodePtr &cnode);
|
||||
|
||||
STATUS ProcessLstmWeightByIndex(const CNodePtr &cnode, const PrimitivePtr &primitive, const int &index);
|
||||
|
||||
|
@ -61,16 +61,17 @@ class WeightQuantizer : public Quantizer {
|
|||
std::vector<std::vector<std::string>> images_; // multi_input, [[mode_input_0], [model_input_1]...]
|
||||
std::vector<std::unordered_map<std::string, mindspore::tensor::MSTensor *>> fp32_output_tensors_;
|
||||
|
||||
STATUS DoMixedQuant(FuncGraphPtr);
|
||||
STATUS SetAbstract(ParamValueLitePtr param_value, ParameterPtr param_node, const PrimitivePtr &primitive);
|
||||
STATUS DoFixedQuant(FuncGraphPtr);
|
||||
STATUS RunFp32Graph(FuncGraphPtr);
|
||||
STATUS DoMixedQuant(const FuncGraphPtr &);
|
||||
STATUS SetAbstract(const tensor::TensorPtr &tensor_info, const ParameterPtr ¶m_node,
|
||||
const PrimitivePtr &primitive);
|
||||
STATUS DoFixedQuant(const FuncGraphPtr &);
|
||||
STATUS RunFp32Graph(const FuncGraphPtr &);
|
||||
|
||||
STATUS DoMixedQuantize(const FuncGraphPtr &func_graph);
|
||||
STATUS CheckImageCnt();
|
||||
STATUS GetParamNodeAndValue(const std::shared_ptr<AnfNode> &input_node, const std::string &op_name,
|
||||
ParameterPtr *param_node, ParamValueLitePtr *param_value);
|
||||
STATUS TryQuant(const int &bit_num_t, const ParameterPtr ¶m_node, const ParamValueLitePtr ¶m_value,
|
||||
ParameterPtr *param_node, tensor::TensorPtr *tensor_info);
|
||||
STATUS TryQuant(const int &bit_num_t, const ParameterPtr ¶m_node, const tensor::TensorPtr &tensor_info,
|
||||
const PrimitivePtr &primitive);
|
||||
STATUS DoQuantSearch(const FuncGraphPtr &func_graph);
|
||||
};
|
||||
|
|
|
@ -23,6 +23,7 @@
|
|||
#include "Eigen/Core"
|
||||
#include "ops/fusion/conv2d_fusion.h"
|
||||
#include "src/common/common.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "frontend/operator/ops.h"
|
||||
#include "backend/optimizer/common/helper.h"
|
||||
|
||||
|
@ -433,33 +434,31 @@ int CheckLeastInputSize(const CNodePtr &node, const int size) {
|
|||
}
|
||||
|
||||
ParameterPtr AddNewBiasNode(float *bias_data, const FuncGraphPtr &func_graph, int kernel_num,
|
||||
const ParamValueLitePtr &weight_tensor) {
|
||||
const tensor::TensorPtr &weight_tensor) {
|
||||
auto bias_parameter = func_graph->add_parameter();
|
||||
MS_ASSERT(bias_parameter != nullptr);
|
||||
std::vector<int> shape = {kernel_num};
|
||||
std::vector<int64_t> shape_vector;
|
||||
(void)std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
auto abstract_tensor =
|
||||
std::make_shared<abstract::AbstractTensor>(TypeIdToType(weight_tensor->tensor_type()), shape_vector);
|
||||
bias_parameter->set_abstract(abstract_tensor);
|
||||
std::vector<int64_t> shape_vector = {kernel_num};
|
||||
auto tensor_info = lite::CreateTensorInfo(bias_data, kernel_num * sizeof(float) / sizeof(uint8_t), shape_vector,
|
||||
weight_tensor->data_type());
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return nullptr;
|
||||
}
|
||||
auto status = lite::InitParameterFromTensorInfo(bias_parameter, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
param_value->SetTensorData(bias_data, kernel_num * sizeof(float) / sizeof(uint8_t));
|
||||
param_value->set_format(weight_tensor->format());
|
||||
param_value->set_tensor_type(weight_tensor->tensor_type());
|
||||
param_value->set_tensor_shape(shape);
|
||||
bias_parameter->set_default_param(param_value);
|
||||
return bias_parameter;
|
||||
}
|
||||
|
||||
ParamValueLitePtr GetLiteParamValue(const AnfNodePtr &node) {
|
||||
tensor::TensorPtr GetTensorInfo(const AnfNodePtr &node) {
|
||||
MS_ASSERT(node != nullptr);
|
||||
if (!utils::isa<ParameterPtr>(node)) {
|
||||
if (utils::isa<ValueNodePtr>(node)) {
|
||||
auto valueNode = node->cast<ValueNodePtr>();
|
||||
auto value = std::dynamic_pointer_cast<ParamValueLite>(valueNode->value());
|
||||
auto value = std::dynamic_pointer_cast<tensor::Tensor>(valueNode->value());
|
||||
if (value != nullptr) {
|
||||
return value;
|
||||
}
|
||||
|
@ -469,8 +468,8 @@ ParamValueLitePtr GetLiteParamValue(const AnfNodePtr &node) {
|
|||
}
|
||||
auto param = node->cast<ParameterPtr>();
|
||||
MS_ASSERT(param != nullptr);
|
||||
auto param_value = std::dynamic_pointer_cast<ParamValueLite>(param->default_param());
|
||||
return param_value;
|
||||
auto tensor_info = std::dynamic_pointer_cast<tensor::Tensor>(param->default_param());
|
||||
return tensor_info;
|
||||
}
|
||||
|
||||
AbstractBasePtr GetCNodeInputAbstract(const CNodePtr &cnode, size_t index) {
|
||||
|
@ -526,11 +525,11 @@ bool IsParamNode(const BaseRef &n) {
|
|||
return false;
|
||||
}
|
||||
auto param = utils::cast<ParameterPtr>(n)->default_param();
|
||||
auto tensor = std::dynamic_pointer_cast<ParamValueLite>(param);
|
||||
auto tensor = std::dynamic_pointer_cast<tensor::Tensor>(param);
|
||||
if (tensor == nullptr) {
|
||||
return false;
|
||||
}
|
||||
return tensor->tensor_addr() != nullptr;
|
||||
return tensor->data_c() != nullptr;
|
||||
}
|
||||
|
||||
bool IsConvNode(const BaseRef &n) {
|
||||
|
@ -717,8 +716,8 @@ std::shared_ptr<std::vector<std::pair<AnfNodePtr, int>>> GetRealNodeUsedListByOu
|
|||
}
|
||||
return output_node_list;
|
||||
}
|
||||
STATUS GetFilterDim(const std::vector<int32_t> &oriDims, kTransFilterType type, int32_t *filterK, int32_t *filterC,
|
||||
int32_t *filterH, int32_t *filterW) {
|
||||
STATUS GetFilterDim(const std::vector<int64_t> &oriDims, kTransFilterType type, int64_t *filterK, int64_t *filterC,
|
||||
int64_t *filterH, int64_t *filterW) {
|
||||
MS_ASSERT(oriDims.size() == 4);
|
||||
std::unordered_map<kTransFilterType, int> maps = {
|
||||
{kKCHW2HWCK, 1}, {kKCHW2HWKC, 1}, {kKCHW2KHWC, 1}, {kKCHW2CKHW, 1}, {kCKHW2HWCK, 2},
|
||||
|
@ -780,7 +779,7 @@ STATUS GetFilterDim(const std::vector<int32_t> &oriDims, kTransFilterType type,
|
|||
return RET_OK;
|
||||
}
|
||||
|
||||
STATUS SetFilterDim(const ParamValueLitePtr &tensor, kTransFilterType type, int32_t filterK, int32_t filterC,
|
||||
STATUS SetFilterDim(const tensor::TensorPtr &tensor, kTransFilterType type, int32_t filterK, int32_t filterC,
|
||||
int32_t filterH, int32_t filterW) {
|
||||
MS_ASSERT(tensor != nullptr);
|
||||
std::unordered_map<kTransFilterType, int> maps = {
|
||||
|
@ -796,22 +795,22 @@ STATUS SetFilterDim(const ParamValueLitePtr &tensor, kTransFilterType type, int3
|
|||
|
||||
switch (maps.find(type)->second) {
|
||||
case 1:
|
||||
tensor->set_tensor_shape({filterH, filterW, filterC, filterK});
|
||||
tensor->set_shape({filterH, filterW, filterC, filterK});
|
||||
break;
|
||||
case 2:
|
||||
tensor->set_tensor_shape({filterH, filterW, filterK, filterC});
|
||||
tensor->set_shape({filterH, filterW, filterK, filterC});
|
||||
break;
|
||||
case 3:
|
||||
tensor->set_tensor_shape({filterK, filterC, filterH, filterW});
|
||||
tensor->set_shape({filterK, filterC, filterH, filterW});
|
||||
break;
|
||||
case 4:
|
||||
tensor->set_tensor_shape({filterC, filterK, filterH, filterW});
|
||||
tensor->set_shape({filterC, filterK, filterH, filterW});
|
||||
break;
|
||||
case 5:
|
||||
tensor->set_tensor_shape({filterC, filterH, filterW, filterK});
|
||||
tensor->set_shape({filterC, filterH, filterW, filterK});
|
||||
break;
|
||||
case 6:
|
||||
tensor->set_tensor_shape({filterK, filterH, filterW, filterC});
|
||||
tensor->set_shape({filterK, filterH, filterW, filterC});
|
||||
break;
|
||||
default:
|
||||
MS_LOG(ERROR) << "Unsupported transFilterType: " << type;
|
||||
|
@ -981,7 +980,7 @@ void TransFilterDataKHWC2CHWK(kTransFilterType type, int32_t filterK, int32_t fi
|
|||
}
|
||||
|
||||
template <typename T>
|
||||
static STATUS TransFilterData(const ParamValueLitePtr &tensor, kTransFilterType type, int32_t filterK, int32_t filterC,
|
||||
static STATUS TransFilterData(const tensor::TensorPtr &tensor, kTransFilterType type, int32_t filterK, int32_t filterC,
|
||||
int32_t filterH, int32_t filterW) {
|
||||
MS_ASSERT(tensor != nullptr);
|
||||
int count = filterH * filterW * filterC * filterK;
|
||||
|
@ -995,7 +994,7 @@ static STATUS TransFilterData(const ParamValueLitePtr &tensor, kTransFilterType
|
|||
return RET_ERROR;
|
||||
}
|
||||
|
||||
void *originWeightData = tensor->tensor_addr();
|
||||
void *originWeightData = tensor->data_c();
|
||||
T *weightData = static_cast<T *>(originWeightData);
|
||||
|
||||
if (weightData == nullptr) {
|
||||
|
@ -1046,7 +1045,7 @@ static STATUS TransFilterData(const ParamValueLitePtr &tensor, kTransFilterType
|
|||
}
|
||||
}
|
||||
|
||||
auto ret = ::memcpy_s(tensor->tensor_addr(), count * sizeof(T), buf.get(), count * sizeof(T));
|
||||
auto ret = ::memcpy_s(tensor->data_c(), count * sizeof(T), buf.get(), count * sizeof(T));
|
||||
if (ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s failed: " << ret;
|
||||
return RET_ERROR;
|
||||
|
@ -1055,18 +1054,18 @@ static STATUS TransFilterData(const ParamValueLitePtr &tensor, kTransFilterType
|
|||
}
|
||||
|
||||
template <typename T>
|
||||
static STATUS TransFilterFormat(const ParamValueLitePtr &tensor, kTransFilterType type) {
|
||||
static STATUS TransFilterFormat(const tensor::TensorPtr &tensor, kTransFilterType type) {
|
||||
MS_ASSERT(tensor != nullptr);
|
||||
auto oriDims = tensor->tensor_shape();
|
||||
auto oriDims = tensor->shape_c();
|
||||
if (oriDims.size() != (size_t)lite::DIM_DEFAULT_SIZE) {
|
||||
MS_LOG(ERROR) << "Filter dim-num is not supported, dim-num: " << oriDims.size();
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
|
||||
int32_t filterH;
|
||||
int32_t filterW;
|
||||
int32_t filterC;
|
||||
int32_t filterK;
|
||||
int64_t filterH;
|
||||
int64_t filterW;
|
||||
int64_t filterC;
|
||||
int64_t filterK;
|
||||
auto status = GetFilterDim(oriDims, type, &filterK, &filterC, &filterH, &filterW);
|
||||
if (status != lite::RET_OK) {
|
||||
MS_LOG(ERROR) << "GetFilterDim failed: " << status;
|
||||
|
@ -1086,7 +1085,7 @@ static STATUS TransFilterFormat(const ParamValueLitePtr &tensor, kTransFilterTyp
|
|||
return lite::RET_OK;
|
||||
}
|
||||
|
||||
STATUS TransFilterFormatWithType(const ParamValueLitePtr &tensor, TypeId data_type,
|
||||
STATUS TransFilterFormatWithType(const tensor::TensorPtr &tensor, TypeId data_type,
|
||||
kTransFilterType trans_filter_type) {
|
||||
if (data_type == kNumberTypeFloat32) {
|
||||
return TransFilterFormat<float>(tensor, trans_filter_type);
|
||||
|
@ -1102,17 +1101,16 @@ STATUS TransFilterFormatWithType(const ParamValueLitePtr &tensor, TypeId data_ty
|
|||
}
|
||||
}
|
||||
|
||||
STATUS TransFilterFormat(const ParamValueLitePtr &tensor, schema::Format dst_format) {
|
||||
STATUS TransFilterFormat(const tensor::TensorPtr &tensor, schema::Format src_format, schema::Format dst_format) {
|
||||
if (tensor == nullptr) {
|
||||
return lite::RET_NULL_PTR;
|
||||
}
|
||||
auto ori_dims = tensor->tensor_shape();
|
||||
auto ori_dims = tensor->shape_c();
|
||||
if (ori_dims.size() != (size_t)lite::DIM_DEFAULT_SIZE) {
|
||||
MS_LOG(ERROR) << "Filter dim-num is not supported, dim-num: " << ori_dims.size();
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
auto src_format = tensor->format();
|
||||
auto data_type = tensor->tensor_type();
|
||||
auto data_type = tensor->data_type();
|
||||
lite::STATUS status;
|
||||
std::unordered_map<schema::Format, kTransFilterType> khwc_trans_maps = {
|
||||
{schema::Format::Format_KCHW, kKCHW2KHWC}, {schema::Format::Format_CKHW, kCKHW2KHWC},
|
||||
|
@ -1195,42 +1193,42 @@ STATUS TransFilterFormat(const ParamValueLitePtr &tensor, schema::Format dst_for
|
|||
}
|
||||
|
||||
ParameterPtr BuildParameterNode(const FuncGraphPtr &func_graph, const AnfNodePtr &node,
|
||||
const ParamValueLitePtr ¶m_value) {
|
||||
const tensor::TensorPtr &tensor_info) {
|
||||
MS_ASSERT(func_graph != nullptr);
|
||||
MS_ASSERT(cnode != nullptr);
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
auto param_node = func_graph->add_parameter();
|
||||
auto shape = param_value->tensor_shape();
|
||||
auto shape = tensor_info->shape();
|
||||
std::vector<int64_t> shape_vector;
|
||||
std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int &val) { return static_cast<int64_t>(val); });
|
||||
auto data_type = param_value->tensor_type() == kNumberTypeInt64 ? kNumberTypeInt32 : param_value->tensor_type();
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(TypeIdToType(data_type), shape_vector);
|
||||
param_node->set_abstract(abstract_tensor);
|
||||
auto data_type = tensor_info->data_type() == kNumberTypeInt64 ? kNumberTypeInt32 : tensor_info->data_type();
|
||||
if (utils::isa<CNodePtr>(node)) {
|
||||
param_node->set_name(node->cast<CNodePtr>()->fullname_with_scope());
|
||||
} else if (utils::isa<ParameterPtr>(node)) {
|
||||
param_node->set_name(node->cast<ParameterPtr>()->name());
|
||||
}
|
||||
ParamValueLitePtr param_value_new = std::make_shared<ParamValueLite>();
|
||||
param_value_new->set_format(param_value->format());
|
||||
param_value_new->set_tensor_shape(shape);
|
||||
auto tensor_info_new = std::make_shared<tensor::Tensor>(data_type, shape_vector);
|
||||
if (tensor_info_new == nullptr) {
|
||||
MS_LOG(ERROR) << "new tensor::Tensor failed.";
|
||||
return nullptr;
|
||||
}
|
||||
size_t data_count = std::accumulate(shape.begin(), shape.end(), 1, std::multiplies<int>());
|
||||
if (param_value->tensor_size() == 0) {
|
||||
if (param_value->tensor_type() == kNumberTypeInt64) {
|
||||
param_value_new->set_tensor_type(kNumberTypeInt32);
|
||||
if (tensor_info->Size() == 0) {
|
||||
auto status = lite::InitParameterFromTensorInfo(param_node, tensor_info_new);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
param_node->set_default_param(param_value_new);
|
||||
return param_node;
|
||||
}
|
||||
if (param_value->tensor_type() == kNumberTypeInt64) {
|
||||
param_value_new->set_tensor_type(kNumberTypeInt32);
|
||||
auto *tensor_data = new (std::nothrow) int[data_count];
|
||||
if (tensor_info->data_type() == kNumberTypeInt64) {
|
||||
auto *tensor_data = reinterpret_cast<int *>(tensor_info_new->data_c());
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new data failed";
|
||||
return nullptr;
|
||||
}
|
||||
auto *origin_data = reinterpret_cast<int64_t *>(param_value->tensor_addr());
|
||||
auto *origin_data = reinterpret_cast<int64_t *>(tensor_info->data_c());
|
||||
for (size_t i = 0; i < data_count; ++i) {
|
||||
if (origin_data[i] > static_cast<int64_t>(INT32_MAX) || origin_data[i] < static_cast<int64_t>(INT32_MIN)) {
|
||||
MS_LOG(WARNING) << "int64 data " << origin_data[i] << "too big to fit into int32";
|
||||
|
@ -1239,23 +1237,24 @@ ParameterPtr BuildParameterNode(const FuncGraphPtr &func_graph, const AnfNodePtr
|
|||
tensor_data[i] = static_cast<int>(origin_data[i]);
|
||||
}
|
||||
}
|
||||
param_value_new->SetTensorData(tensor_data, data_count * sizeof(int32_t));
|
||||
} else {
|
||||
param_value_new->set_tensor_type(param_value->tensor_type());
|
||||
char *tensor_data = new (std::nothrow) char[param_value->tensor_size()];
|
||||
tensor_info_new->set_data_type(tensor_info->data_type());
|
||||
auto *tensor_data = reinterpret_cast<char *>(tensor_info_new->data_c());
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new data failed";
|
||||
return nullptr;
|
||||
}
|
||||
if (memcpy_s(tensor_data, param_value->tensor_size(), param_value->tensor_addr(), param_value->tensor_size()) !=
|
||||
lite::RET_OK) {
|
||||
if (memcpy_s(tensor_data, tensor_info->Size(), tensor_info->data_c(), tensor_info->Size()) != lite::RET_OK) {
|
||||
MS_LOG(ERROR) << "memcpy data failed.";
|
||||
delete[] tensor_data;
|
||||
return nullptr;
|
||||
}
|
||||
param_value_new->SetTensorData(tensor_data, param_value->tensor_size());
|
||||
}
|
||||
param_node->set_default_param(param_value_new);
|
||||
auto status = lite::InitParameterFromTensorInfo(param_node, tensor_info_new);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
param_node->set_default_param(tensor_info_new);
|
||||
return param_node;
|
||||
}
|
||||
|
||||
|
@ -1264,21 +1263,19 @@ ParameterPtr BuildIntValueParameterNode(const FuncGraphPtr &func_graph, const in
|
|||
MS_ASSERT(func_graph != nullptr);
|
||||
MS_ASSERT(data.size() != 0);
|
||||
auto param_node = func_graph->add_parameter();
|
||||
|
||||
auto type_ptr = TypeIdToType(kNumberTypeInt32);
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr);
|
||||
param_node->set_abstract(abstract_tensor);
|
||||
param_node->set_name(node_name);
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
param_value->set_tensor_shape({1});
|
||||
param_value->set_tensor_type(kNumberTypeInt32);
|
||||
auto tensor_info = lite::CreateTensorInfo(&data, sizeof(int32_t), {1}, kNumberTypeInt32);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Create tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
char *default_data = new (std::nothrow) char[sizeof(int32_t)];
|
||||
*(reinterpret_cast<int32_t *>(default_data)) = data;
|
||||
param_value->SetTensorData(default_data, sizeof(int32_t));
|
||||
param_node->set_default_param(param_value);
|
||||
auto status = lite::InitParameterFromTensorInfo(param_node, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
return param_node;
|
||||
}
|
||||
|
||||
|
@ -1287,29 +1284,21 @@ ParameterPtr BuildIntVecParameterNode(const FuncGraphPtr &func_graph, const std:
|
|||
MS_ASSERT(func_graph != nullptr);
|
||||
MS_ASSERT(data.size() != 0);
|
||||
auto param_node = func_graph->add_parameter();
|
||||
|
||||
auto type_ptr = TypeIdToType(kNumberTypeInt32);
|
||||
std::vector<int64_t> shape_vector{static_cast<int64_t>(data.size())};
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape_vector);
|
||||
param_node->set_abstract(abstract_tensor);
|
||||
param_node->set_name(node_name);
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
std::vector<int32_t> shape{static_cast<int32_t>(data.size())};
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_tensor_type(kNumberTypeInt32);
|
||||
|
||||
if (!data.empty()) {
|
||||
char *default_data = new (std::nothrow) char[data.size() * sizeof(int32_t)];
|
||||
if (memcpy_s(default_data, data.size() * sizeof(int32_t), data.data(), data.size() * sizeof(int32_t)) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy data failed.";
|
||||
delete[] default_data;
|
||||
return nullptr;
|
||||
}
|
||||
param_value->SetTensorData(default_data, data.size() * sizeof(int32_t));
|
||||
std::vector<int64_t> shape_vector{static_cast<int64_t>(data.size())};
|
||||
auto tensor_info = lite::CreateTensorInfo(data.data(), data.size() * sizeof(int32_t), shape_vector, kNumberTypeInt32);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Create tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
param_node->set_default_param(param_value);
|
||||
|
||||
auto status = lite::InitParameterFromTensorInfo(param_node, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
return param_node;
|
||||
}
|
||||
|
||||
|
@ -1318,39 +1307,28 @@ ParameterPtr BuildIntVec2DParameterNode(const FuncGraphPtr &func_graph, const st
|
|||
MS_ASSERT(func_graph != nullptr);
|
||||
MS_ASSERT(data.size() != 0);
|
||||
auto param_node = func_graph->add_parameter();
|
||||
param_node->set_name(node_name);
|
||||
|
||||
auto type_ptr = TypeIdToType(kNumberTypeInt32);
|
||||
std::vector<int64_t> shape_vector;
|
||||
shape_vector.push_back(data.size());
|
||||
shape_vector.push_back(2);
|
||||
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape_vector);
|
||||
param_node->set_abstract(abstract_tensor);
|
||||
param_node->set_name(node_name);
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
std::vector<int32_t> shape;
|
||||
shape.push_back(data.size());
|
||||
shape.push_back(2);
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_tensor_type(kNumberTypeInt32);
|
||||
|
||||
std::vector<int32_t> data_1d;
|
||||
for (auto pair : data) {
|
||||
data_1d.insert(data_1d.end(), pair.begin(), pair.end());
|
||||
}
|
||||
|
||||
auto size = data_1d.size() * sizeof(int32_t);
|
||||
char *default_data = new (std::nothrow) char[size];
|
||||
if (memcpy_s(default_data, size, data_1d.data(), size) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy data failed.";
|
||||
delete[] default_data;
|
||||
auto tensor_info = lite::CreateTensorInfo(data_1d.data(), size, shape_vector, kNumberTypeInt32);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Create tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
auto status = lite::InitParameterFromTensorInfo(param_node, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
param_value->SetTensorData(default_data, size);
|
||||
param_node->set_default_param(param_value);
|
||||
return param_node;
|
||||
}
|
||||
|
||||
|
@ -1359,26 +1337,18 @@ ParameterPtr BuildFloatValueParameterNode(const FuncGraphPtr &func_graph, const
|
|||
MS_ASSERT(func_graph != nullptr);
|
||||
MS_ASSERT(data.size() != 0);
|
||||
auto param_node = func_graph->add_parameter();
|
||||
|
||||
auto type_ptr = TypeIdToType(kNumberTypeFloat32);
|
||||
std::vector<int64_t> shape_vector = {1};
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape_vector);
|
||||
param_node->set_abstract(abstract_tensor);
|
||||
param_node->set_name(node_name);
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
param_value->set_tensor_shape({1});
|
||||
param_value->set_tensor_type(kNumberTypeFloat32);
|
||||
|
||||
char *default_data = new (std::nothrow) char[sizeof(float)];
|
||||
if (memcpy_s(default_data, sizeof(float), &data, sizeof(float)) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy data failed.";
|
||||
delete[] default_data;
|
||||
auto tensor_info = lite::CreateTensorInfo(&data, sizeof(float), {1}, kNumberTypeFloat32);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Create tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
auto status = lite::InitParameterFromTensorInfo(param_node, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
param_value->SetTensorData(default_data, sizeof(float));
|
||||
param_node->set_default_param(param_value);
|
||||
return param_node;
|
||||
}
|
||||
} // namespace opt
|
||||
|
|
|
@ -26,7 +26,6 @@
|
|||
#include "src/common/utils.h"
|
||||
#include "backend/optimizer/common/pattern_engine.h"
|
||||
#include "schema/inner/model_generated.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/converter/converter_context.h"
|
||||
|
||||
using PrimitiveCPtr = std::shared_ptr<mindspore::ops::PrimitiveC>;
|
||||
|
@ -39,6 +38,7 @@ inline const PrimitivePtr kPrimDivFusion = std::make_shared<Primitive>("DivFusio
|
|||
inline const PrimitivePtr kPrimErf = std::make_shared<Primitive>("Erf");
|
||||
inline const PrimitivePtr kPrimMakeTupleV2 = std::make_shared<Primitive>("make_tuple");
|
||||
inline const PrimitivePtr kPrimIdentity = std::make_shared<Primitive>("Identity");
|
||||
constexpr auto kWeightFormat = "weight_format";
|
||||
std::vector<int> CastToInt(const ValuePtr &value);
|
||||
|
||||
std::vector<std::vector<int>> CastToVec2DInt(const ValuePtr &value);
|
||||
|
@ -66,7 +66,7 @@ int CheckIfNodeIsParam(const AnfNodePtr &node);
|
|||
int CheckLeastInputSize(const CNodePtr &node, int size);
|
||||
|
||||
ParameterPtr AddNewBiasNode(float *bias_data, const FuncGraphPtr &func_graph, int kernel_num,
|
||||
const ParamValueLitePtr &weight_tensor);
|
||||
const tensor::TensorPtr &weight_tensor);
|
||||
|
||||
bool IsParamNode(const BaseRef &n);
|
||||
|
||||
|
@ -88,7 +88,7 @@ bool IsMultiOutputTensors(const FuncGraphPtr &graph, const AnfNodePtr &node);
|
|||
|
||||
size_t GetTupleGetItemOutIndex(const CNodePtr &tuple_get_item);
|
||||
|
||||
ParamValueLitePtr GetLiteParamValue(const AnfNodePtr &node);
|
||||
tensor::TensorPtr GetTensorInfo(const AnfNodePtr &node);
|
||||
|
||||
AbstractBasePtr GetCNodeInputAbstract(const CNodePtr &cnode, size_t index);
|
||||
|
||||
|
@ -118,23 +118,23 @@ enum kTransFilterType {
|
|||
kHWKC2KHWC
|
||||
};
|
||||
|
||||
STATUS GetFilterDim(const std::vector<int32_t> &oriDims, kTransFilterType type, int32_t *filterK, int32_t *filterC,
|
||||
int32_t *filterH, int32_t *filterW);
|
||||
STATUS GetFilterDim(const std::vector<int64_t> &oriDims, kTransFilterType type, int64_t *filterK, int64_t *filterC,
|
||||
int64_t *filterH, int64_t *filterW);
|
||||
|
||||
STATUS SetFilterDim(const ParamValueLitePtr &tensor, kTransFilterType type, int32_t filterK, int32_t filterC,
|
||||
STATUS SetFilterDim(const tensor::TensorPtr &tensor, kTransFilterType type, int32_t filterK, int32_t filterC,
|
||||
int32_t filterH, int32_t filterW);
|
||||
|
||||
template <typename T>
|
||||
static STATUS TransFilterData(const ParamValueLitePtr &tensor, kTransFilterType type, int32_t filterK, int32_t filterC,
|
||||
static STATUS TransFilterData(const tensor::TensorPtr &tensor, kTransFilterType type, int32_t filterK, int32_t filterC,
|
||||
int32_t filterH, int32_t filterW);
|
||||
|
||||
template <typename T>
|
||||
static lite::STATUS TransFilterFormat(const ParamValueLitePtr &tensor, kTransFilterType type);
|
||||
static lite::STATUS TransFilterFormat(const tensor::TensorPtr &tensor, kTransFilterType type);
|
||||
|
||||
STATUS TransFilterFormat(const ParamValueLitePtr &tensor, schema::Format dst_format);
|
||||
STATUS TransFilterFormat(const tensor::TensorPtr &tensor, schema::Format src_format, schema::Format dst_format);
|
||||
|
||||
ParameterPtr BuildParameterNode(const FuncGraphPtr &func_graph, const AnfNodePtr &node,
|
||||
const ParamValueLitePtr ¶m_value);
|
||||
const tensor::TensorPtr &tensor_info);
|
||||
|
||||
ParameterPtr BuildIntValueParameterNode(const FuncGraphPtr &func_graph, const int32_t &data,
|
||||
const std::string &node_name);
|
||||
|
|
|
@ -19,8 +19,7 @@
|
|||
#include <algorithm>
|
||||
#include "ops/mat_mul.h"
|
||||
#include "schema/inner/model_generated.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "utils/utils.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "tools/converter/quant_param_holder.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
@ -52,12 +51,12 @@ void *GetInputAddr(const AnfNodePtr &node, size_t input_index) {
|
|||
}
|
||||
if (cnode->input(input_index)->isa<Parameter>()) {
|
||||
auto param_input = cnode->input(input_index)->cast<ParameterPtr>();
|
||||
auto param_value = std::dynamic_pointer_cast<ParamValueLite>(param_input->default_param());
|
||||
if (param_value == nullptr) {
|
||||
MS_LOG(ERROR) << "param not paramValueLite";
|
||||
auto tensor_info = std::dynamic_pointer_cast<tensor::Tensor>(param_input->default_param());
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "param not tensor::Tensor";
|
||||
return nullptr;
|
||||
}
|
||||
return param_value->tensor_addr();
|
||||
return tensor_info->data_c();
|
||||
}
|
||||
MS_LOG(ERROR) << "input not parameter";
|
||||
return nullptr;
|
||||
|
@ -68,42 +67,36 @@ STATUS GetRightMatmulInputParamter(const CNodePtr &stack_node, const ParameterPt
|
|||
auto joint_fullconnect_size = stack_node->inputs().size() - 1;
|
||||
auto fc = stack_node->input(1)->cast<CNodePtr>();
|
||||
auto fc_weight = fc->input(2)->cast<ParameterPtr>();
|
||||
auto fc_weight_param = std::dynamic_pointer_cast<ParamValueLite>(fc_weight->default_param());
|
||||
auto tensor_size = fc_weight_param->tensor_size();
|
||||
auto rmatmul_input_shape = fc_weight_param->tensor_shape();
|
||||
auto new_tensor_data = new (std::nothrow) int8_t[joint_fullconnect_size * tensor_size];
|
||||
if (new_tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor_data is nullptr";
|
||||
auto fc_weight_param = std::dynamic_pointer_cast<tensor::Tensor>(fc_weight->default_param());
|
||||
auto tensor_size = fc_weight_param->Size();
|
||||
auto rmatmul_input_shape = fc_weight_param->shape();
|
||||
|
||||
rmatmul_input_shape.insert(rmatmul_input_shape.begin(), joint_fullconnect_size);
|
||||
std::vector<int64_t> shape_vector(rmatmul_input_shape.begin(), rmatmul_input_shape.end());
|
||||
auto tensor_info = lite::CreateTensorInfo(nullptr, 0, shape_vector, fc_weight_param->data_type());
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "Create tensor info failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
for (size_t i = 1; i < joint_fullconnect_size + 1; i++) {
|
||||
auto tensor_addr = GetInputAddr(stack_node->input(i), 2);
|
||||
if (tensor_addr == nullptr) {
|
||||
MS_LOG(ERROR) << "input tensor addr nullptr";
|
||||
delete[] new_tensor_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (EOK != memcpy_s(new_tensor_data + (i - 1) * tensor_size, tensor_size, tensor_addr, tensor_size)) {
|
||||
if (EOK != memcpy_s(static_cast<int8_t *>(tensor_info->data_c()) + (i - 1) * tensor_size, tensor_size, tensor_addr,
|
||||
tensor_size)) {
|
||||
MS_LOG(ERROR) << "memcpy_s data failed";
|
||||
delete[] new_tensor_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
}
|
||||
rmatmul_input_shape.insert(rmatmul_input_shape.begin(), joint_fullconnect_size);
|
||||
auto type_ptr = TypeIdToType(fc_weight_param->tensor_type());
|
||||
std::vector<int64_t> shape_vector;
|
||||
(void)std::transform(rmatmul_input_shape.begin(), rmatmul_input_shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape_vector);
|
||||
rmatmul_input->set_abstract(abstract_tensor);
|
||||
auto status = lite::InitParameterFromTensorInfo(rmatmul_input, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
rmatmul_input->set_name(stack_node->fullname_with_scope() + "right_parameter");
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
param_value->set_tensor_shape(rmatmul_input_shape);
|
||||
param_value->set_tensor_type(fc_weight_param->tensor_type());
|
||||
param_value->set_format(fc_weight_param->format());
|
||||
param_value->SetTensorData(new_tensor_data, joint_fullconnect_size * tensor_size);
|
||||
rmatmul_input->set_default_param(param_value);
|
||||
|
||||
return RET_OK;
|
||||
}
|
||||
} // namespace
|
||||
|
|
|
@ -18,11 +18,11 @@
|
|||
#include <memory>
|
||||
#include <set>
|
||||
#include <vector>
|
||||
#include <algorithm>
|
||||
#include "tools/converter/quant_param_holder.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "tools/anf_exporter/anf_exporter.h"
|
||||
#include "tools/common/node_util.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "src/common/common.h"
|
||||
#include "src/ops/populate/populate_register.h"
|
||||
#include "src/kernel_registry.h"
|
||||
|
@ -85,34 +85,27 @@ ParameterPtr CreateNewParamter(const FuncGraphPtr &func_graph, Tensor *tensor) {
|
|||
auto parameter = func_graph->add_parameter();
|
||||
std::vector<int> shape(tensor->shape());
|
||||
std::vector<int64_t> shape_vector;
|
||||
(void)std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
auto type_id = static_cast<TypeId>(tensor->data_type());
|
||||
auto type_ptr = TypeIdToType(type_id);
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape_vector);
|
||||
parameter->set_abstract(abstract_tensor);
|
||||
std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_tensor_type(type_id);
|
||||
param_value->set_format(tensor->format());
|
||||
auto tensor_info = std::make_shared<tensor::Tensor>(tensor->data_type(), shape_vector);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return nullptr;
|
||||
}
|
||||
if (tensor->MutableData() != nullptr) {
|
||||
auto size = tensor->Size();
|
||||
auto tensor_data = new (std::nothrow) uint8_t[size];
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor_data is nullptr";
|
||||
return nullptr;
|
||||
}
|
||||
auto ret = memcpy_s(tensor_data, size, tensor->MutableData(), tensor->Size());
|
||||
auto tensor_data = static_cast<uint8_t *>(tensor_info->data_c());
|
||||
auto ret = memcpy_s(tensor_data, tensor->Size(), tensor->MutableData(), tensor->Size());
|
||||
if (ret != EOK) {
|
||||
delete[] tensor_data;
|
||||
MS_LOG(ERROR) << "memcpy error: " << ret;
|
||||
return nullptr;
|
||||
}
|
||||
param_value->SetTensorData(tensor_data, size);
|
||||
}
|
||||
parameter->set_default_param(param_value);
|
||||
auto status = lite::InitParameterFromTensorInfo(parameter, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
return parameter;
|
||||
}
|
||||
kernel::LiteKernel *GetLiteKernel(std::vector<Tensor *> inputs, std::vector<Tensor *> *outputs, const CNodePtr &cnode,
|
||||
|
@ -203,11 +196,11 @@ lite::STATUS CopyQuantParams(const CNodePtr &cnode, const std::vector<Tensor *>
|
|||
const std::vector<Tensor *> &outputs) {
|
||||
MS_ASSERT(cnode != nullptr);
|
||||
auto prim = GetValueNode<PrimitivePtr>(cnode->input(0));
|
||||
auto quant_param_valueptr = prim->GetAttr("quant_params");
|
||||
if (quant_param_valueptr == nullptr) {
|
||||
auto quant_tensor_info_ptr = prim->GetAttr("quant_params");
|
||||
if (quant_tensor_info_ptr == nullptr) {
|
||||
return lite::RET_OK;
|
||||
}
|
||||
auto quant_param_holder = quant_param_valueptr->cast<lite::QuantParamHolderPtr>();
|
||||
auto quant_param_holder = quant_tensor_info_ptr->cast<lite::QuantParamHolderPtr>();
|
||||
if (quant_param_holder == nullptr) {
|
||||
MS_LOG(ERROR) << "quant param is invalid.";
|
||||
return lite::RET_ERROR;
|
||||
|
|
|
@ -18,7 +18,7 @@
|
|||
#include "ops/fusion/add_fusion.h"
|
||||
#include "ops/fusion/conv2d_fusion.h"
|
||||
#include "ops/fusion/conv2d_transpose_fusion.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "utils/utils.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
@ -102,9 +102,9 @@ int GenConvNewBias(const FuncGraphPtr &func_graph, const CNodePtr &conv_node, co
|
|||
return lite::RET_INVALID_OP_ATTR;
|
||||
}
|
||||
auto add_weight_param = bias_add_weight->cast<ParameterPtr>()->default_param();
|
||||
auto add_weight_tensor = std::dynamic_pointer_cast<ParamValueLite>(add_weight_param);
|
||||
auto add_weight_data = reinterpret_cast<float *>(add_weight_tensor->tensor_addr());
|
||||
auto add_weight_shape = add_weight_tensor->tensor_shape();
|
||||
auto add_weight_tensor = std::dynamic_pointer_cast<tensor::Tensor>(add_weight_param);
|
||||
auto add_weight_data = reinterpret_cast<float *>(add_weight_tensor->data_c());
|
||||
auto add_weight_shape = add_weight_tensor->shape();
|
||||
if (add_weight_shape.empty() || (add_weight_shape.size() == 1 && add_weight_shape[0] == 1)) {
|
||||
for (int i = 0; i < kernel_nums; i++) {
|
||||
add_bias_data[i] = *add_weight_data;
|
||||
|
@ -122,20 +122,20 @@ int GenConvNewBias(const FuncGraphPtr &func_graph, const CNodePtr &conv_node, co
|
|||
return lite::RET_INVALID_OP_ATTR;
|
||||
}
|
||||
auto conv_bias_param = conv_bias_node->cast<ParameterPtr>()->default_param();
|
||||
auto conv_bias_tensor = std::dynamic_pointer_cast<ParamValueLite>(conv_bias_param);
|
||||
if (conv_bias_tensor->tensor_shape().empty() || conv_bias_tensor->tensor_shape()[0] != kernel_nums) {
|
||||
auto conv_bias_tensor = std::dynamic_pointer_cast<tensor::Tensor>(conv_bias_param);
|
||||
if (conv_bias_tensor->shape().empty() || conv_bias_tensor->shape()[0] != kernel_nums) {
|
||||
MS_LOG(ERROR) << "conv_bias_node shape error";
|
||||
delete[] add_bias_data;
|
||||
return lite::RET_INVALID_OP_ATTR;
|
||||
}
|
||||
auto conv_bias_data = reinterpret_cast<float *>(conv_bias_tensor->tensor_addr());
|
||||
auto conv_bias_data = reinterpret_cast<float *>(conv_bias_tensor->data_c());
|
||||
for (int i = 0; i < kernel_nums; i++) {
|
||||
conv_bias_data[i] += add_bias_data[i];
|
||||
}
|
||||
delete[] add_bias_data;
|
||||
} else {
|
||||
auto conv_weight_param = conv_weight_node->cast<ParameterPtr>()->default_param();
|
||||
auto conv_weight_tensor = std::dynamic_pointer_cast<ParamValueLite>(conv_weight_param);
|
||||
auto conv_weight_tensor = std::dynamic_pointer_cast<tensor::Tensor>(conv_weight_param);
|
||||
auto conv_new_bias = AddNewBiasNode(add_bias_data, func_graph, kernel_nums, conv_weight_tensor);
|
||||
conv_new_bias->set_name(conv_node->fullname_with_scope() + "_bias");
|
||||
conv_node->add_input(conv_new_bias);
|
||||
|
|
|
@ -18,7 +18,6 @@
|
|||
#include <memory>
|
||||
#include "ops/batch_norm.h"
|
||||
#include "ops/fused_batch_norm.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "utils/utils.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
@ -46,8 +45,8 @@ bool IsBatchNode(const BaseRef &n) {
|
|||
void CalTransale(const AnfNodePtr &bn_scale_node, const AnfNodePtr &bn_var_node, float *trans_scale, float eps,
|
||||
int kernel_num) {
|
||||
auto bn_var_param = bn_var_node->cast<ParameterPtr>()->default_param();
|
||||
auto bn_var_tensor = std::dynamic_pointer_cast<ParamValueLite>(bn_var_param);
|
||||
auto bn_var_data = reinterpret_cast<float *>(bn_var_tensor->tensor_addr());
|
||||
auto bn_var_tensor = std::dynamic_pointer_cast<tensor::Tensor>(bn_var_param);
|
||||
auto bn_var_data = reinterpret_cast<float *>(bn_var_tensor->data_c());
|
||||
// cal transScale, tf : scale/sqrt(variance + eps); caffe : 1/sqrt(variance + eps)
|
||||
if (memcpy_s(trans_scale, kernel_num * sizeof(float), bn_var_data, kernel_num * sizeof(float)) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s transScale error";
|
||||
|
@ -67,8 +66,8 @@ void CalTransale(const AnfNodePtr &bn_scale_node, const AnfNodePtr &bn_var_node,
|
|||
}
|
||||
if (bn_scale_node != nullptr) {
|
||||
auto bn_scale_param = bn_scale_node->cast<ParameterPtr>()->default_param();
|
||||
auto bn_scale_tensor = std::dynamic_pointer_cast<ParamValueLite>(bn_scale_param);
|
||||
auto bn_scale_data = reinterpret_cast<float *>(bn_scale_tensor->tensor_addr());
|
||||
auto bn_scale_tensor = std::dynamic_pointer_cast<tensor::Tensor>(bn_scale_param);
|
||||
auto bn_scale_data = reinterpret_cast<float *>(bn_scale_tensor->data_c());
|
||||
// scale/sqrt(variance + eps)
|
||||
for (int32_t i = 0; i < kernel_num; i++) {
|
||||
trans_scale[i] *= bn_scale_data[i];
|
||||
|
@ -78,8 +77,8 @@ void CalTransale(const AnfNodePtr &bn_scale_node, const AnfNodePtr &bn_var_node,
|
|||
void CalTransBias(const AnfNodePtr &bn_mean_node, const AnfNodePtr &bn_bias_node, const float *trans_scale,
|
||||
float *trans_bias, int kernel_num) {
|
||||
auto bn_mean_param = bn_mean_node->cast<ParameterPtr>()->default_param();
|
||||
auto bn_mean_tensor = std::dynamic_pointer_cast<ParamValueLite>(bn_mean_param);
|
||||
auto bn_mean_data = reinterpret_cast<float *>(bn_mean_tensor->tensor_addr());
|
||||
auto bn_mean_tensor = std::dynamic_pointer_cast<tensor::Tensor>(bn_mean_param);
|
||||
auto bn_mean_data = reinterpret_cast<float *>(bn_mean_tensor->data_c());
|
||||
// cal transBias, tf : -scale*mean/sqrt(variance + eps) + bias; caffe : -mean/sqrt(variance + eps)
|
||||
// -mean/sqrt(variance + eps)
|
||||
for (int32_t i = 0; i < kernel_num; i++) {
|
||||
|
@ -88,8 +87,8 @@ void CalTransBias(const AnfNodePtr &bn_mean_node, const AnfNodePtr &bn_bias_node
|
|||
|
||||
if (bn_bias_node != nullptr) {
|
||||
auto bn_bias_param = bn_bias_node->cast<ParameterPtr>()->default_param();
|
||||
auto bn_bias_tensor = std::dynamic_pointer_cast<ParamValueLite>(bn_bias_param);
|
||||
auto bn_bias_data = reinterpret_cast<float *>(bn_bias_tensor->tensor_addr());
|
||||
auto bn_bias_tensor = std::dynamic_pointer_cast<tensor::Tensor>(bn_bias_param);
|
||||
auto bn_bias_data = reinterpret_cast<float *>(bn_bias_tensor->data_c());
|
||||
// -scale*mean/sqrt(variance + eps) + bias
|
||||
for (int32_t i = 0; i < kernel_num; i++) {
|
||||
trans_bias[i] += bn_bias_data[i];
|
||||
|
@ -108,18 +107,18 @@ STATUS CalEstimatedData(const AnfNodePtr &origin_node, const AnfNodePtr &scale_f
|
|||
return RET_ERROR;
|
||||
}
|
||||
auto origin_param = origin_node->cast<ParameterPtr>()->default_param();
|
||||
auto origin_tensor = std::dynamic_pointer_cast<ParamValueLite>(origin_param);
|
||||
auto origin_data = reinterpret_cast<float *>(origin_tensor->tensor_addr());
|
||||
auto origin_tensor = std::dynamic_pointer_cast<tensor::Tensor>(origin_param);
|
||||
auto origin_data = reinterpret_cast<float *>(origin_tensor->data_c());
|
||||
|
||||
auto scale_factor_param = scale_factor_node->cast<ParameterPtr>()->default_param();
|
||||
auto scale_factor_tensor = std::dynamic_pointer_cast<ParamValueLite>(scale_factor_param);
|
||||
if (scale_factor_tensor->tensor_shape_size() < 1) {
|
||||
auto scale_factor_tensor = std::dynamic_pointer_cast<tensor::Tensor>(scale_factor_param);
|
||||
if (scale_factor_tensor->DataSize() < 1) {
|
||||
MS_LOG(ERROR) << "scale factor data size is not equal to 1";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto scale_factor_data = (reinterpret_cast<float *>(scale_factor_tensor->tensor_addr()))[0];
|
||||
auto scale_factor_data = (reinterpret_cast<float *>(scale_factor_tensor->data_c()))[0];
|
||||
float scale_factor = scale_factor_data == 0 ? 0 : 1 / scale_factor_data;
|
||||
for (int i = 0; i < origin_tensor->tensor_shape_size(); i++) {
|
||||
for (int i = 0; i < origin_tensor->DataSize(); i++) {
|
||||
origin_data[i] = origin_data[i] * scale_factor;
|
||||
}
|
||||
return RET_OK;
|
||||
|
|
|
@ -15,9 +15,9 @@
|
|||
*/
|
||||
|
||||
#include "tools/optimizer/fusion/conv_conv_fusion.h"
|
||||
#include <functional>
|
||||
#include <memory>
|
||||
#include <vector>
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "ops/fusion/conv2d_fusion.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
|
||||
|
@ -57,33 +57,33 @@ STATUS GenNewConvBias(const ParameterPtr &down_bias_node, const ParameterPtr &do
|
|||
const ParameterPtr &up_bias_node, const ParameterPtr &new_bias_node) {
|
||||
float *down_bias_data = nullptr;
|
||||
if (down_bias_node != nullptr) {
|
||||
auto down_bias_param = std::dynamic_pointer_cast<ParamValueLite>(down_bias_node->default_param());
|
||||
auto down_bias_shape = down_bias_param->tensor_shape();
|
||||
auto down_bias_param = std::dynamic_pointer_cast<tensor::Tensor>(down_bias_node->default_param());
|
||||
auto down_bias_shape = down_bias_param->shape();
|
||||
if (down_bias_shape.size() != 1) {
|
||||
MS_LOG(ERROR) << "cur conv_conv fusion only support scalar bias shape";
|
||||
return RET_FAILED;
|
||||
}
|
||||
down_bias_data = static_cast<float *>(down_bias_param->tensor_addr());
|
||||
down_bias_data = static_cast<float *>(down_bias_param->data_c());
|
||||
}
|
||||
auto up_bias_param = std::dynamic_pointer_cast<ParamValueLite>(up_bias_node->default_param());
|
||||
auto up_bias_shape = up_bias_param->tensor_shape();
|
||||
auto up_bias_param = std::dynamic_pointer_cast<tensor::Tensor>(up_bias_node->default_param());
|
||||
auto up_bias_shape = up_bias_param->shape();
|
||||
if (up_bias_shape.size() != 1) {
|
||||
MS_LOG(ERROR) << "cur conv_conv fusion only support scalar bias shape";
|
||||
return RET_FAILED;
|
||||
}
|
||||
auto down_weight_param = std::dynamic_pointer_cast<ParamValueLite>(down_weight_node->default_param());
|
||||
auto down_weight_data = static_cast<float *>(down_weight_param->tensor_addr());
|
||||
auto down_weight_shape = down_weight_param->tensor_shape();
|
||||
auto up_bias_data = static_cast<float *>(up_bias_param->tensor_addr());
|
||||
auto down_weight_param = std::dynamic_pointer_cast<tensor::Tensor>(down_weight_node->default_param());
|
||||
auto down_weight_data = static_cast<float *>(down_weight_param->data_c());
|
||||
auto down_weight_shape = down_weight_param->shape();
|
||||
auto up_bias_data = static_cast<float *>(up_bias_param->data_c());
|
||||
int new_bias_size = down_weight_shape[0];
|
||||
auto new_bias_data = new (std::nothrow) float[new_bias_size];
|
||||
if (new_bias_data == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor_data is nullptr";
|
||||
auto tensor_info = lite::CreateTensorInfo(nullptr, 0, {new_bias_size}, up_bias_param->data_type());
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto new_bias_data = static_cast<float *>(tensor_info->data_c());
|
||||
if (memset_s(new_bias_data, new_bias_size * sizeof(float), 0, new_bias_size * sizeof(float)) != EOK) {
|
||||
MS_LOG(ERROR) << "memset_s failed";
|
||||
delete[] new_bias_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto up_bias_size = up_bias_shape[0];
|
||||
|
@ -95,43 +95,33 @@ STATUS GenNewConvBias(const ParameterPtr &down_bias_node, const ParameterPtr &do
|
|||
new_bias_data[i] += down_bias_data[i];
|
||||
}
|
||||
}
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
param_value->set_tensor_shape({new_bias_size});
|
||||
param_value->set_tensor_type(up_bias_param->tensor_type());
|
||||
param_value->set_format(up_bias_param->format());
|
||||
param_value->SetTensorData(new_bias_data, sizeof(float) * new_bias_size);
|
||||
|
||||
new_bias_node->set_name(down_bias_node->fullname_with_scope());
|
||||
new_bias_node->set_default_param(param_value);
|
||||
new_bias_node->set_default_param(tensor_info);
|
||||
new_bias_node->set_abstract(down_bias_node->abstract());
|
||||
return RET_OK;
|
||||
}
|
||||
// up weight shape[cout0,h,w,cin0] down weight shape[cout1,1,1,cout0],new weight shape [cout1,h,w,cin0]
|
||||
STATUS GenNewConvWeight(const ParameterPtr &down_weight_node, const ParameterPtr &up_weight_node,
|
||||
const ParameterPtr &new_weight_node) {
|
||||
auto down_weight_param = std::dynamic_pointer_cast<ParamValueLite>(down_weight_node->default_param());
|
||||
auto down_weight_shape = down_weight_param->tensor_shape();
|
||||
auto up_weight_param = std::dynamic_pointer_cast<ParamValueLite>(up_weight_node->default_param());
|
||||
auto up_weight_shape = up_weight_param->tensor_shape();
|
||||
auto up_weight_data = static_cast<float *>(up_weight_param->tensor_addr());
|
||||
auto down_weight_data = static_cast<float *>(down_weight_param->tensor_addr());
|
||||
auto down_weight_param = std::dynamic_pointer_cast<tensor::Tensor>(down_weight_node->default_param());
|
||||
auto down_weight_shape = down_weight_param->shape();
|
||||
auto up_weight_param = std::dynamic_pointer_cast<tensor::Tensor>(up_weight_node->default_param());
|
||||
auto up_weight_shape = up_weight_param->shape();
|
||||
auto up_weight_data = static_cast<float *>(up_weight_param->data_c());
|
||||
auto down_weight_data = static_cast<float *>(down_weight_param->data_c());
|
||||
int cout0 = up_weight_shape[0];
|
||||
int cin0 = up_weight_shape[kNHWC_CDim];
|
||||
int cout1 = down_weight_shape[0];
|
||||
int window_size = up_weight_shape[kNHWC_WDim] * up_weight_shape[kNHWC_HDim];
|
||||
auto new_weight_shape = up_weight_shape;
|
||||
new_weight_shape[0] = down_weight_shape[0];
|
||||
int size = std::accumulate(new_weight_shape.begin(), new_weight_shape.end(), 1, std::multiplies<>());
|
||||
auto new_weight_data = new (std::nothrow) float[size];
|
||||
if (new_weight_data == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor_data is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (memset_s(new_weight_data, size * sizeof(float), 0, size * sizeof(float)) != EOK) {
|
||||
MS_LOG(ERROR) << "memset_s failed";
|
||||
delete[] new_weight_data;
|
||||
auto tensor_info = lite::CreateTensorInfo(nullptr, 0, new_weight_shape, up_weight_param->data_type());
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto new_weight_data = static_cast<float *>(tensor_info->data_c());
|
||||
for (int i = 0; i < cout1; i++) {
|
||||
auto down_weight_base = i * cout0;
|
||||
auto new_weight_base = i * window_size * cin0;
|
||||
|
@ -148,14 +138,9 @@ STATUS GenNewConvWeight(const ParameterPtr &down_weight_node, const ParameterPtr
|
|||
}
|
||||
}
|
||||
}
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
param_value->set_tensor_shape(new_weight_shape);
|
||||
param_value->set_tensor_type(up_weight_param->tensor_type());
|
||||
param_value->set_format(up_weight_param->format());
|
||||
param_value->SetTensorData(new_weight_data, sizeof(float) * size);
|
||||
|
||||
new_weight_node->set_name(down_weight_node->fullname_with_scope());
|
||||
new_weight_node->set_default_param(param_value);
|
||||
new_weight_node->set_default_param(tensor_info);
|
||||
new_weight_node->set_abstract(down_weight_node->abstract());
|
||||
return RET_OK;
|
||||
}
|
||||
|
@ -230,9 +215,9 @@ const AnfNodePtr ConvConvFusion::Process(const FuncGraphPtr &func_graph, const A
|
|||
return nullptr;
|
||||
}
|
||||
auto down_weight_parameter = down_conv_cnode->input(kConvWeightIndex)->cast<ParameterPtr>();
|
||||
auto down_weight_value = std::dynamic_pointer_cast<ParamValueLite>(down_weight_parameter->default_param());
|
||||
auto down_weight_shape = down_weight_value->tensor_shape();
|
||||
auto down_weight_type = down_weight_value->tensor_type();
|
||||
auto down_weight_value = std::dynamic_pointer_cast<tensor::Tensor>(down_weight_parameter->default_param());
|
||||
auto down_weight_shape = down_weight_value->shape();
|
||||
auto down_weight_type = down_weight_value->data_type();
|
||||
// down conv node filter must 1x1,only support float32
|
||||
if (down_weight_shape.size() != kNHWC_DIMS || down_weight_type != kNumberTypeFloat32 ||
|
||||
(down_weight_shape[kNHWC_HDim] != 1 || down_weight_shape[kNHWC_WDim] != 1)) {
|
||||
|
@ -241,9 +226,9 @@ const AnfNodePtr ConvConvFusion::Process(const FuncGraphPtr &func_graph, const A
|
|||
|
||||
auto up_conv_cnode = down_conv_cnode->input(1)->cast<CNodePtr>();
|
||||
auto up_weight_parameter = up_conv_cnode->input(kConvWeightIndex)->cast<ParameterPtr>();
|
||||
auto up_weight_value = std::dynamic_pointer_cast<ParamValueLite>(up_weight_parameter->default_param());
|
||||
auto up_weight_shape = up_weight_value->tensor_shape();
|
||||
auto up_weight_type = up_weight_value->tensor_type();
|
||||
auto up_weight_value = std::dynamic_pointer_cast<tensor::Tensor>(up_weight_parameter->default_param());
|
||||
auto up_weight_shape = up_weight_value->shape();
|
||||
auto up_weight_type = up_weight_value->data_type();
|
||||
if (up_weight_shape.size() != kNHWC_DIMS || up_weight_type != kNumberTypeFloat32 ||
|
||||
(up_weight_shape[kNHWC_HDim] != 1 || up_weight_shape[kNHWC_WDim] != 1)) {
|
||||
return nullptr;
|
||||
|
|
|
@ -16,7 +16,6 @@
|
|||
|
||||
#include "tools/optimizer/fusion/conv_scale_fusion.h"
|
||||
#include <memory>
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
||||
|
@ -70,8 +69,8 @@ void ConvScaleFusion::InitTransParam(const CNodePtr &scale_node, int kernel_num,
|
|||
return;
|
||||
}
|
||||
auto scale_weight_param = scale_weight_node->cast<ParameterPtr>()->default_param();
|
||||
auto weight_value = std::dynamic_pointer_cast<ParamValueLite>(scale_weight_param);
|
||||
auto weight_data = reinterpret_cast<const float *>(weight_value->tensor_addr());
|
||||
auto weight_value = std::dynamic_pointer_cast<tensor::Tensor>(scale_weight_param);
|
||||
auto weight_data = reinterpret_cast<const float *>(weight_value->data_c());
|
||||
|
||||
if (EOK != memcpy_s(trans_scale, kernel_num * sizeof(float), weight_data, kernel_num * sizeof(float))) {
|
||||
MS_LOG(ERROR) << "memcpy_s transScale failed";
|
||||
|
@ -81,8 +80,8 @@ void ConvScaleFusion::InitTransParam(const CNodePtr &scale_node, int kernel_num,
|
|||
|
||||
if (scale_bias_node != nullptr) {
|
||||
auto scale_bias_param = scale_bias_node->cast<ParameterPtr>()->default_param();
|
||||
auto bias_value = std::dynamic_pointer_cast<ParamValueLite>(scale_bias_param);
|
||||
auto bias_data = reinterpret_cast<const float *>(bias_value->tensor_addr());
|
||||
auto bias_value = std::dynamic_pointer_cast<tensor::Tensor>(scale_bias_param);
|
||||
auto bias_data = reinterpret_cast<const float *>(bias_value->data_c());
|
||||
if (EOK != memcpy_s(trans_bias, kernel_num * sizeof(float), bias_data, kernel_num * sizeof(float))) {
|
||||
MS_LOG(ERROR) << "memcpy_s transScale failed";
|
||||
lite::ReturnCode::GetSingleReturnCode()->UpdateReturnCode(lite::RET_MEMORY_FAILED);
|
||||
|
|
|
@ -18,7 +18,7 @@
|
|||
#include <memory>
|
||||
#include "ops/fusion/conv2d_fusion.h"
|
||||
#include "ops/fusion/conv2d_transpose_fusion.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
||||
|
@ -70,14 +70,14 @@ void GenerateNewWeightConv2D(float *dst_weight, const float *conv_weight, const
|
|||
}
|
||||
|
||||
void GenerateNewWeightConv2DTranspose(float *dst_weight, const float *scale_weight,
|
||||
const ParamValueLitePtr &weight_tensor, FmkType fmk, int group, int kernel_num) {
|
||||
const tensor::TensorPtr &weight_tensor, FmkType fmk, int group, int kernel_num) {
|
||||
if (dst_weight == nullptr || scale_weight == nullptr || weight_tensor == nullptr) {
|
||||
return;
|
||||
}
|
||||
auto weight_data = reinterpret_cast<float *>(weight_tensor->tensor_addr());
|
||||
auto weight_data = reinterpret_cast<float *>(weight_tensor->data_c());
|
||||
if (fmk == lite::converter::FmkType_TF) {
|
||||
auto cin_group = weight_tensor->tensor_shape()[3] / group;
|
||||
int area_size = weight_tensor->tensor_shape()[0] * weight_tensor->tensor_shape()[1];
|
||||
auto cin_group = weight_tensor->shape()[3] / group;
|
||||
int area_size = weight_tensor->shape()[0] * weight_tensor->shape()[1];
|
||||
for (int j = 0; j < area_size; j++) {
|
||||
for (int i = 0; i < kernel_num; ++i) {
|
||||
for (int k = 0; k < cin_group; ++k) {
|
||||
|
@ -87,8 +87,8 @@ void GenerateNewWeightConv2DTranspose(float *dst_weight, const float *scale_weig
|
|||
}
|
||||
}
|
||||
} else {
|
||||
auto cin_group = weight_tensor->tensor_shape()[0] / group;
|
||||
int area_size = weight_tensor->tensor_shape()[2] * weight_tensor->tensor_shape()[3];
|
||||
auto cin_group = weight_tensor->shape()[0] / group;
|
||||
int area_size = weight_tensor->shape()[2] * weight_tensor->shape()[3];
|
||||
int cout_size = kernel_num * area_size;
|
||||
for (int k = 0; k < cin_group; ++k) {
|
||||
for (int i = 0; i < kernel_num; ++i) {
|
||||
|
@ -197,50 +197,31 @@ void ConvTransformFusion::GenNewConvTensor(const FuncGraphPtr &func_graph, const
|
|||
return;
|
||||
}
|
||||
auto conv_weight_param = conv_weight_node->cast<ParameterPtr>()->default_param();
|
||||
auto weight_tensor = std::dynamic_pointer_cast<ParamValueLite>(conv_weight_param);
|
||||
auto weight_tensor = std::dynamic_pointer_cast<tensor::Tensor>(conv_weight_param);
|
||||
if (kernel_num <= 0) {
|
||||
MS_LOG(ERROR) << "kernel num less than 0";
|
||||
lite::ReturnCode::GetSingleReturnCode()->UpdateReturnCode(lite::RET_INVALID_OP_ATTR);
|
||||
return;
|
||||
}
|
||||
auto temp_weight_data = new (std::nothrow) float[weight_tensor->tensor_shape_size()];
|
||||
if (temp_weight_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new ParamValueLite failed";
|
||||
lite::ReturnCode::GetSingleReturnCode()->UpdateReturnCode(lite::RET_ERROR);
|
||||
return;
|
||||
}
|
||||
auto new_weight_tensor = std::make_shared<ParamValueLite>();
|
||||
auto new_weight_tensor = lite::CreateTensorInfo(weight_tensor->data_c(), weight_tensor->DataSize() * sizeof(float),
|
||||
weight_tensor->shape(), weight_tensor->data_type());
|
||||
if (new_weight_tensor == nullptr) {
|
||||
delete temp_weight_data;
|
||||
MS_LOG(ERROR) << "new ParamValueLite failed";
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return;
|
||||
}
|
||||
new_weight_tensor->set_tensor_size(weight_tensor->tensor_size());
|
||||
new_weight_tensor->set_tensor_shape(weight_tensor->tensor_shape());
|
||||
new_weight_tensor->set_tensor_type(weight_tensor->tensor_type());
|
||||
new_weight_tensor->set_format(weight_tensor->format());
|
||||
auto ret = memcpy_s(temp_weight_data, weight_tensor->tensor_shape_size() * sizeof(float),
|
||||
weight_tensor->tensor_addr(), weight_tensor->tensor_shape_size() * sizeof(float));
|
||||
if (ret != EOK) {
|
||||
delete temp_weight_data;
|
||||
MS_LOG(ERROR) << "memcpy_s error:" << ret;
|
||||
return;
|
||||
}
|
||||
new_weight_tensor->SetTensorData(temp_weight_data, new_weight_tensor->tensor_size());
|
||||
CalNewWeightTensor(conv_node, new_weight_tensor, kernel_num, trans_scale);
|
||||
float *bias_data = nullptr;
|
||||
// conv has bias,bias_flag true
|
||||
bool bias_flag = false;
|
||||
if (conv_bias_node != nullptr) {
|
||||
auto conv_bias_param = conv_bias_node->cast<ParameterPtr>()->default_param();
|
||||
auto bias_tensor = std::dynamic_pointer_cast<ParamValueLite>(conv_bias_param);
|
||||
bias_data = reinterpret_cast<float *>(bias_tensor->tensor_addr());
|
||||
auto bias_tensor = std::dynamic_pointer_cast<tensor::Tensor>(conv_bias_param);
|
||||
bias_data = reinterpret_cast<float *>(bias_tensor->data_c());
|
||||
bias_flag = true;
|
||||
} else {
|
||||
bias_data = new (std::nothrow) float[kernel_num];
|
||||
if (bias_data == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor_data is nullptr";
|
||||
delete temp_weight_data;
|
||||
return;
|
||||
}
|
||||
}
|
||||
|
@ -253,7 +234,6 @@ void ConvTransformFusion::GenNewConvTensor(const FuncGraphPtr &func_graph, const
|
|||
auto new_weight_paramter = func_graph->add_parameter();
|
||||
if (new_weight_paramter == nullptr) {
|
||||
MS_LOG(ERROR) << "new_weight_paramter is nullptr";
|
||||
delete temp_weight_data;
|
||||
return;
|
||||
}
|
||||
new_weight_paramter->set_default_param(new_weight_tensor);
|
||||
|
@ -262,15 +242,15 @@ void ConvTransformFusion::GenNewConvTensor(const FuncGraphPtr &func_graph, const
|
|||
conv_node->set_input(kConvWeightIndex, new_weight_paramter);
|
||||
}
|
||||
|
||||
void ConvTransformFusion::CalNewWeightTensor(const CNodePtr &conv_node, const ParamValueLitePtr &weight_tensor,
|
||||
void ConvTransformFusion::CalNewWeightTensor(const CNodePtr &conv_node, const tensor::TensorPtr &weight_tensor,
|
||||
int kernel_num, const float *trans_scale) const {
|
||||
MS_ASSERT(weight_data != nullptr);
|
||||
MS_ASSERT(trans_scale != nullptr);
|
||||
if (weight_tensor->tensor_shape().size() != 4) {
|
||||
if (weight_tensor->shape().size() != 4) {
|
||||
MS_LOG(ERROR) << "weight tensor shape error";
|
||||
return;
|
||||
}
|
||||
auto weight_shape_size = weight_tensor->tensor_shape_size();
|
||||
auto weight_shape_size = weight_tensor->DataSize();
|
||||
auto tmp_weight_data = new (std::nothrow) float[weight_shape_size];
|
||||
if (tmp_weight_data == nullptr) {
|
||||
lite::ReturnCode::GetSingleReturnCode()->UpdateReturnCode(lite::RET_MEMORY_FAILED);
|
||||
|
@ -284,7 +264,7 @@ void ConvTransformFusion::CalNewWeightTensor(const CNodePtr &conv_node, const Pa
|
|||
lite::ReturnCode::GetSingleReturnCode()->UpdateReturnCode(lite::RET_MEMORY_FAILED);
|
||||
return;
|
||||
}
|
||||
auto weight_data = reinterpret_cast<float *>(weight_tensor->tensor_addr());
|
||||
auto weight_data = reinterpret_cast<float *>(weight_tensor->data_c());
|
||||
auto conv_prim = GetValueNode<PrimitivePtr>(conv_node->input(0));
|
||||
MS_ASSERT(conv_prim != nullptr);
|
||||
bool is_depth_wise =
|
||||
|
|
|
@ -20,7 +20,6 @@
|
|||
#include <string>
|
||||
#include "backend/optimizer/common/optimizer.h"
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "src/param_value_lite.h"
|
||||
|
||||
using mindspore::lite::converter::FmkType;
|
||||
namespace mindspore::opt {
|
||||
|
@ -33,7 +32,7 @@ class ConvTransformFusion : public PatternProcessPass {
|
|||
void GenTransParam(const CNodePtr &, int, float *, float *) const;
|
||||
virtual void InitTransParam(const CNodePtr &, int, float *, float *) const = 0;
|
||||
void GenNewConvTensor(const FuncGraphPtr &, const CNodePtr &, int, const float *, const float *) const;
|
||||
void CalNewWeightTensor(const CNodePtr &, const ParamValueLitePtr &, int, const float *) const;
|
||||
void CalNewWeightTensor(const CNodePtr &, const tensor::TensorPtr &, int, const float *) const;
|
||||
void CalNewBiasTensor(float *, int, bool, const float *, const float *) const;
|
||||
void SetFmkType(FmkType type) { this->fmk_type_ = type; }
|
||||
|
||||
|
|
|
@ -15,7 +15,6 @@
|
|||
*/
|
||||
#include "tools/optimizer/fusion/conv_tuplegetitem_fusion.h"
|
||||
#include <memory>
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
||||
|
|
|
@ -49,17 +49,17 @@ const float GeLUFusion::GetParameterValue(const EquivPtr &equiv, const VarPtr &i
|
|||
if (!parameter_node->has_default() || parameter_node->default_param() == nullptr) {
|
||||
return value;
|
||||
}
|
||||
auto param_value_lite = parameter_node->default_param()->cast<ParamValueLitePtr>();
|
||||
auto param_value_lite = parameter_node->default_param()->cast<tensor::TensorPtr>();
|
||||
if (param_value_lite == nullptr) {
|
||||
return value;
|
||||
}
|
||||
if (param_value_lite->tensor_type() != kNumberTypeFloat32 && param_value_lite->tensor_type() != kNumberTypeFloat) {
|
||||
if (param_value_lite->data_type() != kNumberTypeFloat32 && param_value_lite->data_type() != kNumberTypeFloat) {
|
||||
return value;
|
||||
}
|
||||
if (param_value_lite->tensor_size() != sizeof(float)) {
|
||||
if (param_value_lite->Size() != sizeof(float)) {
|
||||
return value;
|
||||
}
|
||||
return *static_cast<float *>(param_value_lite->tensor_addr());
|
||||
return *static_cast<float *>(param_value_lite->data_c());
|
||||
}
|
||||
|
||||
const AnfNodePtr GeLUFusion::Process(const FuncGraphPtr &func_graph, const AnfNodePtr &node,
|
||||
|
|
|
@ -18,7 +18,6 @@
|
|||
#include "ops/fusion/layer_norm_fusion.h"
|
||||
#include "ops/fusion/reduce_fusion.h"
|
||||
#include "mindspore/core/ops/instance_norm.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "utils/utils.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
@ -33,13 +32,12 @@ STATUS GetReduceAxes(const BaseRef &n, std::vector<int> *axes) {
|
|||
if (!axes_param->has_default() || axes_param->default_param() == nullptr) {
|
||||
return lite::RET_NOT_SUPPORT;
|
||||
}
|
||||
auto axes_value = axes_param->default_param()->cast<ParamValueLitePtr>();
|
||||
auto axes_value = axes_param->default_param()->cast<tensor::TensorPtr>();
|
||||
if (axes_value == nullptr) {
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
axes->resize(axes_value->tensor_shape()[0]);
|
||||
if (memcpy_s(axes->data(), axes_value->tensor_size(), axes_value->tensor_addr(), axes_value->tensor_size()) ==
|
||||
EOK) {
|
||||
axes->resize(axes_value->shape()[0]);
|
||||
if (memcpy_s(axes->data(), axes_value->Size(), axes_value->data_c(), axes_value->Size()) == EOK) {
|
||||
return lite::RET_OK;
|
||||
}
|
||||
}
|
||||
|
@ -174,8 +172,10 @@ bool NormFusion::CheckPattern(const EquivPtr &equiv, schema::PrimitiveType *type
|
|||
return false;
|
||||
}
|
||||
auto beta_param = beta_node->cast<ParameterPtr>()->default_param();
|
||||
auto beta_tensor = std::dynamic_pointer_cast<ParamValueLite>(beta_param);
|
||||
auto beta_shape = beta_tensor->tensor_shape();
|
||||
auto beta_tensor = std::dynamic_pointer_cast<tensor::Tensor>(beta_param);
|
||||
std::vector<int> beta_shape;
|
||||
std::transform(beta_tensor->shape().begin(), beta_tensor->shape().end(), std::back_inserter(beta_shape),
|
||||
[](int64_t val) { return static_cast<int>(val); });
|
||||
// gamma
|
||||
auto gamma_node = utils::cast<AnfNodePtr>((*equiv)[gamma_]);
|
||||
MS_ASSERT(gamma_node != nullptr);
|
||||
|
@ -183,8 +183,10 @@ bool NormFusion::CheckPattern(const EquivPtr &equiv, schema::PrimitiveType *type
|
|||
return false;
|
||||
}
|
||||
auto gamma_param = gamma_node->cast<ParameterPtr>()->default_param();
|
||||
auto gamma_tensor = std::dynamic_pointer_cast<ParamValueLite>(gamma_param);
|
||||
auto gamma_shape = gamma_tensor->tensor_shape();
|
||||
auto gamma_tensor = std::dynamic_pointer_cast<tensor::Tensor>(gamma_param);
|
||||
std::vector<int> gamma_shape;
|
||||
std::transform(gamma_tensor->shape().begin(), gamma_tensor->shape().end(), std::back_inserter(gamma_shape),
|
||||
[](int64_t val) { return static_cast<int>(val); });
|
||||
// epsilon
|
||||
auto epsilon_node = utils::cast<AnfNodePtr>((*equiv)[epsilon_]);
|
||||
MS_ASSERT(epsilon_node != nullptr);
|
||||
|
@ -192,9 +194,9 @@ bool NormFusion::CheckPattern(const EquivPtr &equiv, schema::PrimitiveType *type
|
|||
return false;
|
||||
}
|
||||
auto epsilon_param = epsilon_node->cast<ParameterPtr>()->default_param();
|
||||
auto epsilon_tensor = std::dynamic_pointer_cast<ParamValueLite>(epsilon_param);
|
||||
auto epsilon_data = reinterpret_cast<float *>(epsilon_tensor->tensor_addr());
|
||||
auto epsilon_shape = epsilon_tensor->tensor_shape();
|
||||
auto epsilon_tensor = std::dynamic_pointer_cast<tensor::Tensor>(epsilon_param);
|
||||
auto epsilon_data = reinterpret_cast<float *>(epsilon_tensor->data_c());
|
||||
auto epsilon_shape = epsilon_tensor->shape();
|
||||
// mean2
|
||||
std::vector<int> mean2_axes;
|
||||
if (!IsReduceNode(equiv, mean2_, mean2_axes_, &mean2_axes)) {
|
||||
|
|
|
@ -17,7 +17,6 @@
|
|||
#include <memory>
|
||||
#include "ops/fusion/activation.h"
|
||||
#include "ops/op_utils.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "utils/utils.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
|
||||
|
|
|
@ -21,7 +21,6 @@
|
|||
#include <string>
|
||||
#include "tools/optimizer/fusion/tf_bidirection_gru_fusion.h"
|
||||
#include "schema/inner/model_generated.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "backend/optimizer/common/optimizer.h"
|
||||
#include "utils/utils.h"
|
||||
#include "include/errorcode.h"
|
||||
|
|
|
@ -23,6 +23,7 @@
|
|||
#include "ops/stack.h"
|
||||
#include "ops/transpose.h"
|
||||
#include "src/common/utils.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "utils/utils.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
||||
|
@ -197,7 +198,7 @@ AnfNodePtr TfBidirectionGruFusion::GetBodyGraphPattern(const PrimitiveVarMapPtr
|
|||
return pattern;
|
||||
}
|
||||
|
||||
ParamValueLitePtr TfBidirectionGruFusion::GetDefaultParamValue(const AnfNodePtr ¶meter_anf) const {
|
||||
tensor::TensorPtr TfBidirectionGruFusion::GetDefaultTensorInfo(const AnfNodePtr ¶meter_anf) const {
|
||||
MS_ASSERT(parameter_anf != nullptr);
|
||||
if (!utils::isa<ParameterPtr>(parameter_anf)) {
|
||||
MS_LOG(DEBUG) << "parameter_anf is not ParameterPtr";
|
||||
|
@ -208,8 +209,8 @@ ParamValueLitePtr TfBidirectionGruFusion::GetDefaultParamValue(const AnfNodePtr
|
|||
MS_LOG(DEBUG) << "parameter not have default value";
|
||||
return nullptr;
|
||||
}
|
||||
auto param_value = std::dynamic_pointer_cast<ParamValueLite>(parameter->default_param());
|
||||
return param_value;
|
||||
auto tensor_info = std::dynamic_pointer_cast<tensor::Tensor>(parameter->default_param());
|
||||
return tensor_info;
|
||||
}
|
||||
|
||||
STATUS TfBidirectionGruFusion::GetInputAndHiddenSize(const AnfNodePtr &fw_cand_kernel_anf,
|
||||
|
@ -219,19 +220,19 @@ STATUS TfBidirectionGruFusion::GetInputAndHiddenSize(const AnfNodePtr &fw_cand_k
|
|||
MS_ASSERT(bw_cand_kernel != nullptr);
|
||||
MS_ASSERT(input_size != nullptr);
|
||||
MS_ASSERT(hidden_size != nullptr);
|
||||
auto fw_cand_kernel_value = GetDefaultParamValue(fw_cand_kernel_anf);
|
||||
auto fw_cand_kernel_value = GetDefaultTensorInfo(fw_cand_kernel_anf);
|
||||
if (fw_cand_kernel_value == nullptr) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto fw_cand_kernel_shape = fw_cand_kernel_value->tensor_shape();
|
||||
auto fw_cand_kernel_shape = fw_cand_kernel_value->shape();
|
||||
if (fw_cand_kernel_shape.size() != 2) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto bw_cand_kernel_value = GetDefaultParamValue(bw_cand_kernel_anf);
|
||||
auto bw_cand_kernel_value = GetDefaultTensorInfo(bw_cand_kernel_anf);
|
||||
if (bw_cand_kernel_value == nullptr) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto bw_cand_kernel_shape = bw_cand_kernel_value->tensor_shape();
|
||||
auto bw_cand_kernel_shape = bw_cand_kernel_value->shape();
|
||||
if (bw_cand_kernel_shape.size() != 2) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
@ -261,32 +262,13 @@ ParameterPtr TfBidirectionGruFusion::AddDefaultParameter(const FuncGraphPtr &fun
|
|||
}
|
||||
parameter->set_abstract(abstract_tensor);
|
||||
|
||||
auto gate_weight_default = std::make_shared<ParamValueLite>();
|
||||
auto gate_weight_default = std::make_shared<tensor::Tensor>(type, shape_vector);
|
||||
if (gate_weight_default == nullptr) {
|
||||
MS_LOG(ERROR) << "gate_weight_default is nullptr";
|
||||
return nullptr;
|
||||
}
|
||||
gate_weight_default->set_tensor_shape(shape);
|
||||
gate_weight_default->set_tensor_type(type);
|
||||
gate_weight_default->set_format(schema::Format_NHWC);
|
||||
int data_len = std::accumulate(shape.begin(), shape.end(), 1, std::multiplies<int>());
|
||||
int data_size = 0;
|
||||
if (type == kNumberTypeFloat32 || type == kNumberTypeFloat) {
|
||||
data_size = data_len * sizeof(float);
|
||||
*tensor_data = new (std::nothrow) float[data_len];
|
||||
} else if (type == kNumberTypeInt || type == kNumberTypeInt32) {
|
||||
data_size = data_len * sizeof(int);
|
||||
*tensor_data = new (std::nothrow) int[data_len];
|
||||
} else {
|
||||
MS_LOG(DEBUG) << "unsupported data type";
|
||||
return nullptr;
|
||||
}
|
||||
if (*tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new data failed";
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
gate_weight_default->SetTensorData(*tensor_data, data_size);
|
||||
*tensor_data = gate_weight_default->data_c();
|
||||
parameter->set_default_param(gate_weight_default);
|
||||
return parameter;
|
||||
}
|
||||
|
@ -317,27 +299,27 @@ STATUS TfBidirectionGruFusion::ConvertWeightData(const AnfNodePtr &gate_weight,
|
|||
MS_ASSERT(cand_weight != nullptr);
|
||||
MS_ASSERT(gate_tensor_data != nullptr);
|
||||
MS_ASSERT(recu_tensor_data != nullptr);
|
||||
const std::vector<int> gate_shape{input_size + hidden_size, hidden_size * 2};
|
||||
const std::vector<int> cand_shape{hidden_size * 2, hidden_size};
|
||||
auto gate_weight_value = GetDefaultParamValue(gate_weight);
|
||||
const std::vector<int64_t> gate_shape{input_size + hidden_size, hidden_size * 2};
|
||||
const std::vector<int64_t> cand_shape{hidden_size * 2, hidden_size};
|
||||
auto gate_weight_value = GetDefaultTensorInfo(gate_weight);
|
||||
if (gate_weight_value == nullptr) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto gate_weight_data = reinterpret_cast<float *>(gate_weight_value->tensor_addr());
|
||||
auto gate_weight_data = reinterpret_cast<float *>(gate_weight_value->data_c());
|
||||
if (gate_weight_data == nullptr) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto gate_weight_shape = gate_weight_value->tensor_shape();
|
||||
auto gate_weight_shape = gate_weight_value->shape();
|
||||
|
||||
auto cand_weight_value = GetDefaultParamValue(cand_weight);
|
||||
auto cand_weight_value = GetDefaultTensorInfo(cand_weight);
|
||||
if (cand_weight_value == nullptr) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto cand_weight_data = reinterpret_cast<float *>(cand_weight_value->tensor_addr());
|
||||
auto cand_weight_data = reinterpret_cast<float *>(cand_weight_value->data_c());
|
||||
if (cand_weight_data == nullptr) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto cand_weight_shape = cand_weight_value->tensor_shape();
|
||||
auto cand_weight_shape = cand_weight_value->shape();
|
||||
|
||||
if (gate_weight_shape != gate_shape || cand_weight_shape != cand_shape) {
|
||||
return RET_ERROR;
|
||||
|
@ -369,20 +351,20 @@ STATUS TfBidirectionGruFusion::ConvertBiasData(const AnfNodePtr &gate_bias, cons
|
|||
const int hidden_size, float *tensor_data) const {
|
||||
MS_ASSERT(bias != nullptr);
|
||||
MS_ASSERT(tensor_data != nullptr);
|
||||
std::vector<int> gate_shape{hidden_size * 2};
|
||||
std::vector<int> cand_shape{hidden_size};
|
||||
auto gate_bias_value = GetDefaultParamValue(gate_bias);
|
||||
std::vector<int64_t> gate_shape{hidden_size * 2};
|
||||
std::vector<int64_t> cand_shape{hidden_size};
|
||||
auto gate_bias_value = GetDefaultTensorInfo(gate_bias);
|
||||
if (gate_bias_value == nullptr) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto gate_bias_data = reinterpret_cast<float *>(gate_bias_value->tensor_addr());
|
||||
auto gate_bias_shape = gate_bias_value->tensor_shape();
|
||||
auto cand_bias_value = GetDefaultParamValue(cand_bias);
|
||||
auto gate_bias_data = reinterpret_cast<float *>(gate_bias_value->data_c());
|
||||
auto gate_bias_shape = gate_bias_value->shape();
|
||||
auto cand_bias_value = GetDefaultTensorInfo(cand_bias);
|
||||
if (cand_bias_value == nullptr) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto cand_bias_data = reinterpret_cast<float *>(cand_bias_value->tensor_addr());
|
||||
auto cand_bias_shape = cand_bias_value->tensor_shape();
|
||||
auto cand_bias_data = reinterpret_cast<float *>(cand_bias_value->data_c());
|
||||
auto cand_bias_shape = cand_bias_value->shape();
|
||||
if (gate_bias_shape != gate_shape || cand_bias_shape != cand_shape) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
@ -504,6 +486,8 @@ CNodePtr TfBidirectionGruFusion::CreateBiDirectionGruNode(const FuncGraphPtr &fu
|
|||
std::vector<AnfNodePtr> new_node_inputs = {value_node, input, gate_weight, recu_weight,
|
||||
bias, stacked_hidden, input_length};
|
||||
auto new_node = func_graph->NewCNode(new_node_inputs);
|
||||
auto prim = GetValueNode<PrimitivePtr>(new_node->input(0));
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::NHWC));
|
||||
new_node->set_fullname_with_scope(base_name);
|
||||
return new_node;
|
||||
}
|
||||
|
|
|
@ -21,7 +21,6 @@
|
|||
#include "tools/optimizer/fusion/tflite_lstm_cell_fusion.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "schema/inner/model_generated.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "backend/optimizer/common/optimizer.h"
|
||||
#include "utils/utils.h"
|
||||
#include "include/errorcode.h"
|
||||
|
@ -48,7 +47,7 @@ class TfBidirectionGruFusion : public PatternProcessPass {
|
|||
private:
|
||||
AnfNodePtr GetCondGraphPattern(const PrimitiveVarMapPtr &primitive_vars) const;
|
||||
|
||||
ParamValueLitePtr GetDefaultParamValue(const AnfNodePtr ¶meter_anf) const;
|
||||
tensor::TensorPtr GetDefaultTensorInfo(const AnfNodePtr ¶meter_anf) const;
|
||||
lite::STATUS GetInputAndHiddenSize(const AnfNodePtr &fw_cand_kernel_anf, const AnfNodePtr &bw_cand_kernel_anf,
|
||||
int *input_size, int *hidden_size) const;
|
||||
ParameterPtr AddDefaultParameter(const FuncGraphPtr &func_graph, const std::string &name,
|
||||
|
|
|
@ -17,7 +17,7 @@
|
|||
#include <memory>
|
||||
#include "ops/lstm.h"
|
||||
#include "src/common/utils.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "utils/utils.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
@ -110,19 +110,10 @@ AnfNodePtr TfLstmCellFusion::GetBodyGraphPattern(const PrimitiveVarMapPtr &primi
|
|||
return pattern;
|
||||
}
|
||||
|
||||
STATUS TfLstmCellFusion::SetWeightAbstractAndDefault(const ParameterPtr &weight, const std::vector<int> &shape,
|
||||
STATUS TfLstmCellFusion::SetWeightAbstractAndDefault(const ParameterPtr &weight, const std::vector<int64_t> &shape,
|
||||
const float *const data_ptr, const int hidden_size) const {
|
||||
MS_ASSERT(weight != nullptr);
|
||||
MS_ASSERT(data_ptr != nullptr);
|
||||
auto default_param = std::make_shared<ParamValueLite>();
|
||||
if (default_param == nullptr) {
|
||||
MS_LOG(ERROR) << "new_default is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
default_param->set_tensor_shape(shape);
|
||||
default_param->set_tensor_type(kNumberTypeFloat32);
|
||||
default_param->set_format(schema::Format_NHWC);
|
||||
|
||||
if (shape.size() != 3) {
|
||||
MS_LOG(ERROR) << "lstm weight shape must have 3 dims";
|
||||
return RET_ERROR;
|
||||
|
@ -141,16 +132,17 @@ STATUS TfLstmCellFusion::SetWeightAbstractAndDefault(const ParameterPtr &weight,
|
|||
}
|
||||
}
|
||||
}
|
||||
default_param->SetTensorData(tensor_data, param_num * 4);
|
||||
weight->set_default_param(default_param);
|
||||
std::vector<int64_t> shape_vector_i(shape.begin(), shape.end());
|
||||
auto abstract_tensor_i = std::make_shared<abstract::AbstractTensor>(kFloat32, shape_vector_i);
|
||||
if (abstract_tensor_i == nullptr) {
|
||||
MS_LOG(ERROR) << "abstract_tensor is nullptr";
|
||||
delete[] tensor_data;
|
||||
auto tensor_info = lite::CreateTensorInfo(tensor_data, param_num * 4, shape, kNumberTypeFloat32);
|
||||
delete[] tensor_data;
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto status = lite::InitParameterFromTensorInfo(weight, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
weight->set_abstract(abstract_tensor_i);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
|
@ -169,17 +161,17 @@ STATUS TfLstmCellFusion::SplitWeights(const AnfNodePtr &weight, const ParameterP
|
|||
MS_LOG(DEBUG) << "weight not have default value";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (!utils::isa<ParamValueLitePtr>(weight_param->default_param())) {
|
||||
MS_LOG(DEBUG) << "default value is not ParamValueLite";
|
||||
if (!utils::isa<tensor::TensorPtr>(weight_param->default_param())) {
|
||||
MS_LOG(DEBUG) << "default value is not tensor::Tensor";
|
||||
return RET_FAILED;
|
||||
}
|
||||
auto origin_tensor = std::dynamic_pointer_cast<ParamValueLite>(weight_param->default_param());
|
||||
if (origin_tensor->tensor_type() != kNumberTypeFloat32 && origin_tensor->tensor_type() != kNumberTypeFloat) {
|
||||
auto origin_tensor = std::dynamic_pointer_cast<tensor::Tensor>(weight_param->default_param());
|
||||
if (origin_tensor->data_type() != kNumberTypeFloat32 && origin_tensor->data_type() != kNumberTypeFloat) {
|
||||
MS_LOG(DEBUG) << "origin_tensor is not float32 type";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto data_ptr = reinterpret_cast<float *>(origin_tensor->tensor_addr());
|
||||
auto data_shape = origin_tensor->tensor_shape();
|
||||
auto data_ptr = reinterpret_cast<float *>(origin_tensor->data_c());
|
||||
auto data_shape = origin_tensor->shape();
|
||||
if (data_shape.size() != 2) {
|
||||
MS_LOG(ERROR) << "weight data shape invalid";
|
||||
return RET_ERROR;
|
||||
|
@ -194,13 +186,13 @@ STATUS TfLstmCellFusion::SplitWeights(const AnfNodePtr &weight, const ParameterP
|
|||
}
|
||||
const auto input_size = data_shape[0] - hidden_size;
|
||||
|
||||
std::vector<int> shape_i{1, 4 * hidden_size, input_size};
|
||||
std::vector<int64_t> shape_i{1, 4 * hidden_size, input_size};
|
||||
if (SetWeightAbstractAndDefault(weight_i, shape_i, data_ptr, hidden_size) != RET_OK) {
|
||||
MS_LOG(ERROR) << "get weight_i failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
std::vector<int> shape_c{1, 4 * hidden_size, hidden_size};
|
||||
std::vector<int64_t> shape_c{1, 4 * hidden_size, hidden_size};
|
||||
if (SetWeightAbstractAndDefault(weight_c, shape_c, data_ptr + input_size * data_shape[1], hidden_size) != RET_OK) {
|
||||
MS_LOG(ERROR) << "get weight_i failed";
|
||||
return RET_ERROR;
|
||||
|
@ -222,32 +214,23 @@ STATUS TfLstmCellFusion::PopulateBiasNode(const EquivPtr &body_equiv, const Para
|
|||
MS_LOG(DEBUG) << "bias not have default value";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (!utils::isa<ParamValueLitePtr>(old_bias_param->default_param())) {
|
||||
MS_LOG(DEBUG) << "default value is not ParamValueLite";
|
||||
if (!utils::isa<tensor::TensorPtr>(old_bias_param->default_param())) {
|
||||
MS_LOG(DEBUG) << "default value is not tensor::Tensor";
|
||||
return RET_FAILED;
|
||||
}
|
||||
auto origin_tensor = std::dynamic_pointer_cast<ParamValueLite>(old_bias_param->default_param());
|
||||
if (origin_tensor->tensor_type() != kNumberTypeFloat32 && origin_tensor->tensor_type() != kNumberTypeFloat) {
|
||||
auto origin_tensor = std::dynamic_pointer_cast<tensor::Tensor>(old_bias_param->default_param());
|
||||
if (origin_tensor->data_type() != kNumberTypeFloat32 && origin_tensor->data_type() != kNumberTypeFloat) {
|
||||
MS_LOG(DEBUG) << "origin_tensor is not float32 type";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto data_ptr = reinterpret_cast<float *>(origin_tensor->tensor_addr());
|
||||
auto data_shape = origin_tensor->tensor_shape();
|
||||
auto data_ptr = reinterpret_cast<float *>(origin_tensor->data_c());
|
||||
auto data_shape = origin_tensor->shape();
|
||||
if (data_shape.size() != 1 || data_shape[0] != 4 * hidden_size) {
|
||||
MS_LOG(DEBUG) << "bias data shape illegal";
|
||||
return RET_ERROR;
|
||||
}
|
||||
std::vector<int> shape{1, 8 * hidden_size};
|
||||
|
||||
auto default_param = std::make_shared<ParamValueLite>();
|
||||
if (default_param == nullptr) {
|
||||
MS_LOG(ERROR) << "new_default is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
default_param->set_tensor_shape(shape);
|
||||
default_param->set_tensor_type(kNumberTypeFloat32);
|
||||
default_param->set_format(schema::Format_NHWC);
|
||||
|
||||
std::vector<int64_t> shape{1, 8 * hidden_size};
|
||||
std::unique_ptr<float[]> tensor_data(new (std::nothrow) float[hidden_size * 8]);
|
||||
|
||||
auto forget_bias_node = utils::cast<AnfNodePtr>((*body_equiv)[forget_bias_]);
|
||||
|
@ -256,7 +239,7 @@ STATUS TfLstmCellFusion::PopulateBiasNode(const EquivPtr &body_equiv, const Para
|
|||
return RET_ERROR;
|
||||
}
|
||||
float forget_bias_value = 0.0f;
|
||||
if (GetFloatScalarFromParamValueLite(forget_bias_node, &forget_bias_value) != RET_OK) {
|
||||
if (GetFloatScalarFromTensorInfo(forget_bias_node, &forget_bias_value) != RET_OK) {
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
|
@ -273,15 +256,19 @@ STATUS TfLstmCellFusion::PopulateBiasNode(const EquivPtr &body_equiv, const Para
|
|||
}
|
||||
}
|
||||
}
|
||||
default_param->SetTensorData(tensor_data.release(), hidden_size * 8 * 4);
|
||||
new_bias->set_default_param(default_param);
|
||||
std::vector<int64_t> shape_vector_i(shape.begin(), shape.end());
|
||||
auto abstract_tensor_i = std::make_shared<abstract::AbstractTensor>(kFloat32, shape_vector_i);
|
||||
if (abstract_tensor_i == nullptr) {
|
||||
MS_LOG(ERROR) << "abstract_tensor is nullptr";
|
||||
|
||||
auto tensor_info = lite::CreateTensorInfo(tensor_data.get(), hidden_size * 8 * 4, shape, kNumberTypeFloat32);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
new_bias->set_abstract(abstract_tensor_i);
|
||||
|
||||
auto status = lite::InitParameterFromTensorInfo(new_bias, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
|
|
|
@ -22,7 +22,6 @@
|
|||
#include "tools/optimizer/fusion/tflite_lstm_cell_fusion.h"
|
||||
#include "backend/optimizer/common/optimizer.h"
|
||||
#include "utils/utils.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "include/errorcode.h"
|
||||
|
||||
namespace mindspore {
|
||||
|
@ -40,7 +39,7 @@ class TfLstmCellFusion : public TfliteLstmCellFusion {
|
|||
|
||||
lite::STATUS SplitWeights(const AnfNodePtr &weight, const ParameterPtr &weight_i, const ParameterPtr &weight_c,
|
||||
int hidden_size) const;
|
||||
lite::STATUS SetWeightAbstractAndDefault(const ParameterPtr &weight, const std::vector<int> &shape,
|
||||
lite::STATUS SetWeightAbstractAndDefault(const ParameterPtr &weight, const std::vector<int64_t> &shape,
|
||||
const float *const data_ptr, const int hidden_size) const;
|
||||
lite::STATUS PopulateBiasNode(const EquivPtr &body_equiv, const ParameterPtr &new_bias, const AnfNodePtr &old_bias,
|
||||
const int hidden_size) const;
|
||||
|
|
|
@ -14,15 +14,14 @@
|
|||
* limitations under the License.
|
||||
*/
|
||||
#include "tools/optimizer/fusion/tflite_lstm_cell_fusion.h"
|
||||
#include <algorithm>
|
||||
#include <memory>
|
||||
#include <algorithm>
|
||||
#include <functional>
|
||||
#include "ops/lstm.h"
|
||||
#include "ops/squeeze.h"
|
||||
#include "ops/tuple_get_item.h"
|
||||
#include "src/common/utils.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "schema/inner/model_generated.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "utils/utils.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "securec/include/securec.h"
|
||||
|
@ -51,36 +50,36 @@ bool IsOpType(const BaseRef &n, const PrimitivePtr &prim) {
|
|||
}
|
||||
} // namespace
|
||||
|
||||
STATUS TfliteLstmCellFusion::GetFloatScalarFromParamValueLite(const AnfNodePtr ¶m_value, float *v) const {
|
||||
if (param_value == nullptr || v == nullptr) {
|
||||
MS_LOG(ERROR) << "param_value or v is nullptr";
|
||||
STATUS TfliteLstmCellFusion::GetFloatScalarFromTensorInfo(const AnfNodePtr &tensor_info, float *v) const {
|
||||
if (tensor_info == nullptr || v == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor_info or v is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (!utils::isa<ParameterPtr>(param_value)) {
|
||||
MS_LOG(DEBUG) << "param_value is not ParamValueLitePtr";
|
||||
if (!utils::isa<ParameterPtr>(tensor_info)) {
|
||||
MS_LOG(DEBUG) << "tensor_info is not tensor::TensorPtr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto param_ptr = utils::cast<ParameterPtr>(param_value);
|
||||
auto param_ptr = utils::cast<ParameterPtr>(tensor_info);
|
||||
if (!param_ptr->has_default()) {
|
||||
MS_LOG(DEBUG) << "param not have default";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto default_param = param_ptr->default_param();
|
||||
if (!utils::isa<ParamValueLitePtr>(default_param)) {
|
||||
MS_LOG(DEBUG) << "param_value is not ParamValueLitePtr";
|
||||
if (!utils::isa<tensor::TensorPtr>(default_param)) {
|
||||
MS_LOG(DEBUG) << "tensor_info is not tensor::TensorPtr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto default_param_ptr = utils::cast<ParamValueLitePtr>(default_param);
|
||||
auto tensor_shape = default_param_ptr->tensor_shape();
|
||||
auto default_param_ptr = utils::cast<tensor::TensorPtr>(default_param);
|
||||
auto tensor_shape = default_param_ptr->shape();
|
||||
if (!(tensor_shape.size() == 0 || (tensor_shape.size() == 1 && tensor_shape[0] == 1))) {
|
||||
MS_LOG(DEBUG) << "default param is not scalar";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (default_param_ptr->tensor_type() != kNumberTypeFloat32 && default_param_ptr->tensor_type() != kNumberTypeFloat) {
|
||||
if (default_param_ptr->data_type() != kNumberTypeFloat32 && default_param_ptr->data_type() != kNumberTypeFloat) {
|
||||
MS_LOG(DEBUG) << "default param is not float";
|
||||
return RET_ERROR;
|
||||
}
|
||||
*v = *(reinterpret_cast<float *>(default_param_ptr->tensor_addr()));
|
||||
*v = *(reinterpret_cast<float *>(default_param_ptr->data_c()));
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
|
@ -278,16 +277,16 @@ bool TfliteLstmCellFusion::CheckBodyGraph(const FuncGraphPtr &func_graph, const
|
|||
MS_ASSERT(hidden_zoneout_new_node != nullptr);
|
||||
|
||||
float cell_old, cell_new, hidden_old, hidden_new;
|
||||
if (GetFloatScalarFromParamValueLite(cell_zoneout_old_node, &cell_old) != RET_OK) {
|
||||
if (GetFloatScalarFromTensorInfo(cell_zoneout_old_node, &cell_old) != RET_OK) {
|
||||
return false;
|
||||
}
|
||||
if (GetFloatScalarFromParamValueLite(cell_zoneout_new_node, &cell_new) != RET_OK) {
|
||||
if (GetFloatScalarFromTensorInfo(cell_zoneout_new_node, &cell_new) != RET_OK) {
|
||||
return false;
|
||||
}
|
||||
if (GetFloatScalarFromParamValueLite(hidden_zoneout_old_node, &hidden_old) != RET_OK) {
|
||||
if (GetFloatScalarFromTensorInfo(hidden_zoneout_old_node, &hidden_old) != RET_OK) {
|
||||
return false;
|
||||
}
|
||||
if (GetFloatScalarFromParamValueLite(hidden_zoneout_new_node, &hidden_new) != RET_OK) {
|
||||
if (GetFloatScalarFromTensorInfo(hidden_zoneout_new_node, &hidden_new) != RET_OK) {
|
||||
return false;
|
||||
}
|
||||
if (cell_old < 0.0f || cell_old > 1.0f || cell_new < 0.0f || cell_new > 1.0f) {
|
||||
|
@ -313,7 +312,7 @@ STATUS TfliteLstmCellFusion::GetConcatedParam(const std::vector<AnfNodePtr> &par
|
|||
MS_ASSERT(new_param != nullptr);
|
||||
MS_ASSERT(params.size() == 4);
|
||||
std::vector<float *> data_ptrs;
|
||||
std::vector<std::vector<int>> data_shapes;
|
||||
std::vector<std::vector<int64_t>> data_shapes;
|
||||
for (auto ¶m : params) {
|
||||
if (!utils::isa<ParameterPtr>(param)) {
|
||||
MS_LOG(DEBUG) << "param is not Parameter node";
|
||||
|
@ -324,17 +323,17 @@ STATUS TfliteLstmCellFusion::GetConcatedParam(const std::vector<AnfNodePtr> &par
|
|||
MS_LOG(DEBUG) << "param not have default value";
|
||||
return RET_FAILED;
|
||||
}
|
||||
if (!utils::isa<ParamValueLitePtr>(param_t->default_param())) {
|
||||
MS_LOG(DEBUG) << "default value is not ParamValueLite";
|
||||
if (!utils::isa<tensor::TensorPtr>(param_t->default_param())) {
|
||||
MS_LOG(DEBUG) << "default value is not tensor::Tensor";
|
||||
return RET_FAILED;
|
||||
}
|
||||
auto origin_tensor = std::dynamic_pointer_cast<ParamValueLite>(param_t->default_param());
|
||||
if (origin_tensor->tensor_type() != kNumberTypeFloat32 && origin_tensor->tensor_type() != kNumberTypeFloat) {
|
||||
auto origin_tensor = std::dynamic_pointer_cast<tensor::Tensor>(param_t->default_param());
|
||||
if (origin_tensor->data_type() != kNumberTypeFloat32 && origin_tensor->data_type() != kNumberTypeFloat) {
|
||||
MS_LOG(DEBUG) << "origin_tensor is not float32 type";
|
||||
return RET_FAILED;
|
||||
}
|
||||
auto data_ptr = reinterpret_cast<float *>(origin_tensor->tensor_addr());
|
||||
auto data_shape = origin_tensor->tensor_shape();
|
||||
auto data_ptr = reinterpret_cast<float *>(origin_tensor->data_c());
|
||||
auto data_shape = origin_tensor->shape();
|
||||
data_ptrs.push_back(data_ptr);
|
||||
data_shapes.push_back(data_shape);
|
||||
}
|
||||
|
@ -345,13 +344,7 @@ STATUS TfliteLstmCellFusion::GetConcatedParam(const std::vector<AnfNodePtr> &par
|
|||
return RET_FAILED;
|
||||
}
|
||||
}
|
||||
auto new_default = std::make_shared<ParamValueLite>();
|
||||
if (new_default == nullptr) {
|
||||
MS_LOG(ERROR) << "new_default is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
std::vector<int> new_shape;
|
||||
float *tensor_data = nullptr;
|
||||
std::vector<int64_t> new_shape;
|
||||
int step = 0;
|
||||
int data_size = 0;
|
||||
if (is_bias) {
|
||||
|
@ -361,23 +354,25 @@ STATUS TfliteLstmCellFusion::GetConcatedParam(const std::vector<AnfNodePtr> &par
|
|||
}
|
||||
step = data_shapes[0][0];
|
||||
data_size = 8 * step;
|
||||
new_shape = std::vector<int>({1, data_size});
|
||||
new_shape = std::vector<int64_t>({1, data_size});
|
||||
|
||||
} else {
|
||||
if (data_shapes[0].size() != 2) {
|
||||
MS_LOG(ERROR) << "weight data shape error";
|
||||
return RET_ERROR;
|
||||
}
|
||||
new_shape = std::vector<int>({1, data_shapes[0][0] * 4, data_shapes[0][1]});
|
||||
new_shape = std::vector<int64_t>({1, data_shapes[0][0] * 4, data_shapes[0][1]});
|
||||
step = data_shapes[0][0] * data_shapes[0][1];
|
||||
data_size = 4 * step;
|
||||
}
|
||||
|
||||
tensor_data = new (std::nothrow) float[data_size];
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new data failed";
|
||||
auto tensor_info = lite::CreateTensorInfo(nullptr, 0, new_shape, kNumberTypeFloat32);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
auto tensor_data = static_cast<float *>(tensor_info->data_c());
|
||||
for (int i = 0; i < data_size; ++i) { // bias are stored into first 4*hidden_size buffer, the rest is all 0
|
||||
tensor_data[i] = 0.0f;
|
||||
}
|
||||
|
@ -387,23 +382,16 @@ STATUS TfliteLstmCellFusion::GetConcatedParam(const std::vector<AnfNodePtr> &par
|
|||
auto ret = memcpy_s(tensor_data + i * step, step * sizeof(float), data_ptrs[i], source_len * sizeof(float));
|
||||
if (ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s error";
|
||||
delete[] tensor_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
}
|
||||
new_default->set_tensor_shape(new_shape);
|
||||
new_default->set_tensor_type(kNumberTypeFloat32);
|
||||
new_default->set_format(schema::Format_NHWC);
|
||||
new_default->SetTensorData(tensor_data, data_size * sizeof(float));
|
||||
new_param->set_default_param(new_default);
|
||||
|
||||
std::vector<int64_t> shape_vector(new_shape.begin(), new_shape.end());
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(kFloat32, shape_vector);
|
||||
if (abstract_tensor == nullptr) {
|
||||
MS_LOG(ERROR) << "abstract_tensor is nullptr";
|
||||
auto status = lite::InitParameterFromTensorInfo(new_param, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
new_param->set_abstract(abstract_tensor);
|
||||
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
|
|
|
@ -50,7 +50,7 @@ class TfliteLstmCellFusion : public PatternProcessPass {
|
|||
VarPtr hidden_zoneout_new_ = nullptr;
|
||||
std::vector<VarPtr> while_input_vars_;
|
||||
|
||||
lite::STATUS GetFloatScalarFromParamValueLite(const AnfNodePtr ¶m_value, float *v) const;
|
||||
lite::STATUS GetFloatScalarFromTensorInfo(const AnfNodePtr &tensor_info, float *v) const;
|
||||
CNodePtr CreateSqueezeNode(const FuncGraphPtr &func_graph, const CNodePtr &input_node,
|
||||
const std::vector<int> &axis) const;
|
||||
lite::STATUS AdjustOtherGetItems(const FuncGraphPtr &func_graph, const CNodePtr &while_cnode,
|
||||
|
|
|
@ -54,23 +54,23 @@ bool ClipConvertActivationPass::Run(const FuncGraphPtr &graph) {
|
|||
}
|
||||
if ((min == -1) && (max == -1)) {
|
||||
if (clip_cnode->size() > kClipMinIndex) {
|
||||
auto min_param_value = GetLiteParamValue(clip_cnode->input(kClipMinIndex));
|
||||
if (min_param_value->tensor_type() != mindspore::kNumberTypeFloat32) {
|
||||
auto min_tensor_info = GetTensorInfo(clip_cnode->input(kClipMinIndex));
|
||||
if (min_tensor_info->data_type() != mindspore::kNumberTypeFloat32) {
|
||||
MS_LOG(ERROR) << "Clip param type invalid";
|
||||
return false;
|
||||
}
|
||||
min = *reinterpret_cast<float *>(min_param_value->tensor_addr());
|
||||
min = *reinterpret_cast<float *>(min_tensor_info->data_c());
|
||||
} else {
|
||||
min = FLT_MIN;
|
||||
}
|
||||
|
||||
if (clip_cnode->size() > kClipMaxIndex) {
|
||||
auto max_param_value = GetLiteParamValue(clip_cnode->input(kClipMaxIndex));
|
||||
if (max_param_value->tensor_type() != mindspore::kNumberTypeFloat32) {
|
||||
auto max_tensor_info = GetTensorInfo(clip_cnode->input(kClipMaxIndex));
|
||||
if (max_tensor_info->data_type() != mindspore::kNumberTypeFloat32) {
|
||||
MS_LOG(ERROR) << "Clip param type invalid";
|
||||
return false;
|
||||
}
|
||||
max = *reinterpret_cast<float *>(max_param_value->tensor_addr());
|
||||
max = *reinterpret_cast<float *>(max_tensor_info->data_c());
|
||||
} else {
|
||||
max = FLT_MAX;
|
||||
}
|
||||
|
|
|
@ -19,7 +19,6 @@
|
|||
#include <string>
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "backend/optimizer/common/pass.h"
|
||||
#include "src/param_value_lite.h"
|
||||
|
||||
using mindspore::lite::converter::FmkType;
|
||||
using mindspore::schema::QuantType;
|
||||
|
|
|
@ -23,13 +23,14 @@ namespace {
|
|||
constexpr size_t kTripleNum = 3;
|
||||
constexpr size_t kConvWeightIndex = 2;
|
||||
} // namespace
|
||||
lite::STATUS Conv1DWeightExpandingPass::ExpandFilterShape(const ParamValueLitePtr &tensor) {
|
||||
lite::STATUS Conv1DWeightExpandingPass::ExpandFilterShape(const tensor::TensorPtr &tensor,
|
||||
const schema::Format &format) {
|
||||
if (tensor == nullptr) {
|
||||
return lite::RET_NULL_PTR;
|
||||
}
|
||||
auto shape = tensor->tensor_shape();
|
||||
std::vector<int> new_shape(shape);
|
||||
switch (tensor->format()) {
|
||||
auto shape = tensor->shape();
|
||||
std::vector<int64_t> new_shape(shape);
|
||||
switch (format) {
|
||||
case schema::Format_NCHW:
|
||||
case schema::Format_KCHW:
|
||||
new_shape.insert(new_shape.begin() + 2, 1);
|
||||
|
@ -42,7 +43,7 @@ lite::STATUS Conv1DWeightExpandingPass::ExpandFilterShape(const ParamValueLitePt
|
|||
MS_LOG(ERROR) << "Unsupported format.";
|
||||
return RET_ERROR;
|
||||
}
|
||||
tensor->set_tensor_shape(new_shape);
|
||||
tensor->set_shape(new_shape);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
|
@ -61,14 +62,21 @@ bool Conv1DWeightExpandingPass::Run(const FuncGraphPtr &func_graph) {
|
|||
MS_ASSERT(conv_cnode->inputs().size() > kConvWeightIndex);
|
||||
auto weight_node = conv_cnode->input(kConvWeightIndex);
|
||||
MS_ASSERT(weight_node != nullptr);
|
||||
auto weight_value = GetLiteParamValue(weight_node);
|
||||
auto weight_value = GetTensorInfo(weight_node);
|
||||
if (weight_value == nullptr) {
|
||||
MS_LOG(ERROR) << "weight node must be param value.";
|
||||
return false;
|
||||
}
|
||||
auto prim = GetValueNode<PrimitivePtr>(conv_cnode->input(0));
|
||||
MS_ASSERT(prim != nullptr);
|
||||
|
||||
schema::Format schema_format = schema::Format::Format_KCHW;
|
||||
if (prim->GetAttr(opt::kWeightFormat) != nullptr) {
|
||||
schema_format = static_cast<schema::Format>(GetValue<int64_t>(prim->GetAttr(opt::kWeightFormat)));
|
||||
}
|
||||
// expand weight tensor to 4 dimensions.
|
||||
if (weight_value->tensor_shape().size() == kTripleNum) {
|
||||
auto status = ExpandFilterShape(weight_value);
|
||||
if (weight_value->shape().size() == kTripleNum) {
|
||||
auto status = ExpandFilterShape(weight_value, schema_format);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "Expand filter shape failed.";
|
||||
return false;
|
||||
|
|
|
@ -22,7 +22,6 @@
|
|||
#include "backend/optimizer/common/pass.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
|
||||
using mindspore::ParamValueLitePtr;
|
||||
namespace mindspore::opt {
|
||||
class Conv1DWeightExpandingPass : public Pass {
|
||||
public:
|
||||
|
@ -31,7 +30,7 @@ class Conv1DWeightExpandingPass : public Pass {
|
|||
bool Run(const FuncGraphPtr &graph) override;
|
||||
|
||||
private:
|
||||
lite::STATUS ExpandFilterShape(const ParamValueLitePtr &tensor);
|
||||
lite::STATUS ExpandFilterShape(const tensor::TensorPtr &tensor, const schema::Format &format);
|
||||
};
|
||||
} // namespace mindspore::opt
|
||||
#endif // MINDSPORE_LITE_SRC_PASS_FUSION_CONV1D_WEIGHT_EXPANDING_PASS_H_
|
||||
|
|
|
@ -81,7 +81,7 @@ bool GroupDepthwiseOpConvertPass::Run(const FuncGraphPtr &graph) {
|
|||
MS_ASSERT(conv_cnode->inputs().size() > kConvWeightIndex);
|
||||
auto weight_node = conv_cnode->input(kConvWeightIndex);
|
||||
MS_ASSERT(weight_node != nullptr);
|
||||
auto weight_value = GetLiteParamValue(weight_node);
|
||||
auto weight_value = GetTensorInfo(weight_node);
|
||||
if (weight_value == nullptr) {
|
||||
MS_LOG(ERROR) << "weight node must param value";
|
||||
return false;
|
||||
|
@ -89,19 +89,20 @@ bool GroupDepthwiseOpConvertPass::Run(const FuncGraphPtr &graph) {
|
|||
MS_ASSERT(weight_value->tensor_type() == TypeId::kNumberTypeFloat32 ||
|
||||
weight_value->tensor_type() == TypeId::kNumberTypeInt8);
|
||||
lite::STATUS status;
|
||||
schema::Format weight_dst_format = schema::Format::Format_CHWK;
|
||||
weight_value->set_format(schema::Format_KHWC);
|
||||
status = TransFilterFormat(weight_value, weight_dst_format);
|
||||
auto weight_src_format = schema::Format::Format_KHWC;
|
||||
auto weight_dst_format = schema::Format::Format_CHWK;
|
||||
|
||||
status = TransFilterFormat(weight_value, weight_src_format, weight_dst_format);
|
||||
if (status == RET_OK) {
|
||||
weight_value->set_format(weight_dst_format);
|
||||
conv2d_fusion->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(weight_dst_format));
|
||||
} else {
|
||||
MS_LOG(ERROR) << "TransFilter " << EnumNameFormat(schema::EnumValuesFormat()[weight_value->format()]) << "To"
|
||||
MS_LOG(ERROR) << "TransFilter " << EnumNameFormat(schema::EnumValuesFormat()[weight_dst_format]) << "To"
|
||||
<< EnumNameFormat(weight_dst_format) << " failed, node : " << node->fullname_with_scope();
|
||||
return false;
|
||||
}
|
||||
auto type_id = static_cast<TypeId>(weight_value->tensor_type());
|
||||
auto type_id = static_cast<TypeId>(weight_value->data_type());
|
||||
auto type_ptr = TypeIdToType(type_id);
|
||||
auto shape = weight_value->tensor_shape();
|
||||
auto shape = weight_value->shape();
|
||||
std::vector<int64_t> shape_vector;
|
||||
(void)std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
|
|
|
@ -18,7 +18,6 @@
|
|||
#include <string>
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "backend/optimizer/common/pass.h"
|
||||
#include "src/param_value_lite.h"
|
||||
|
||||
namespace mindspore::opt {
|
||||
class GroupDepthwiseOpConvertPass : public Pass {
|
||||
|
|
|
@ -21,7 +21,6 @@
|
|||
#include "schema/inner/model_generated.h"
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "backend/optimizer/common/pass.h"
|
||||
#include "src/param_value_lite.h"
|
||||
|
||||
using mindspore::lite::converter::FmkType;
|
||||
namespace mindspore::opt {
|
||||
|
|
|
@ -19,6 +19,7 @@
|
|||
#include <algorithm>
|
||||
#include "include/errorcode.h"
|
||||
#include "tools/common/node_util.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "src/common/common.h"
|
||||
#include "src/ops/populate/populate_register.h"
|
||||
#include "src/ops/ops_utils.h"
|
||||
|
@ -27,16 +28,17 @@
|
|||
namespace mindspore::opt {
|
||||
namespace {
|
||||
constexpr size_t INITIAL_SIZE = 1024;
|
||||
ParamValueLitePtr NewParamValueLitePtr(lite::Tensor *tensor) {
|
||||
auto para_value_lite = std::make_shared<ParamValueLite>();
|
||||
if (para_value_lite == nullptr) {
|
||||
MS_LOG(ERROR) << "new ParamValueLite failed";
|
||||
tensor::TensorPtr NewTensorInfo(lite::Tensor *tensor) {
|
||||
std::vector<int> shape(tensor->shape());
|
||||
std::vector<int64_t> shape_vector;
|
||||
std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
auto tensor_info = std::make_shared<tensor::Tensor>(tensor->data_type(), shape_vector);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "new tensor::Tensor failed";
|
||||
return nullptr;
|
||||
}
|
||||
para_value_lite->set_tensor_shape(tensor->shape());
|
||||
para_value_lite->set_tensor_type(tensor->data_type());
|
||||
para_value_lite->set_format(tensor->format());
|
||||
return para_value_lite;
|
||||
return tensor_info;
|
||||
}
|
||||
|
||||
bool IsSpecialType(const CNodePtr &cnode) {
|
||||
|
@ -62,9 +64,9 @@ abstract::AbstractTensorPtr InferShapePass::ConvertLiteTensorToAbstractTensor(li
|
|||
return nullptr;
|
||||
}
|
||||
|
||||
auto para_value_lite = NewParamValueLitePtr(tensor);
|
||||
if (para_value_lite == nullptr) {
|
||||
MS_LOG(ERROR) << "new ParamValueLite failed";
|
||||
auto tensor_info = NewTensorInfo(tensor);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "new tensor::Tensor failed";
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
|
@ -74,76 +76,23 @@ abstract::AbstractTensorPtr InferShapePass::ConvertLiteTensorToAbstractTensor(li
|
|||
MS_LOG(ERROR) << "cast tensor_list failed";
|
||||
return nullptr;
|
||||
}
|
||||
auto tensor_info = new int[tensor_list->element_shape().size() + 2];
|
||||
tensor_info[0] = tensor_list->tensors_data_type();
|
||||
tensor_info[1] = tensor_list->element_shape().size();
|
||||
auto tensor_data = new int[tensor_list->element_shape().size() + 2];
|
||||
tensor_data[0] = tensor_list->tensors_data_type();
|
||||
tensor_data[1] = tensor_list->element_shape().size();
|
||||
for (size_t i = 0; i < tensor_list->element_shape().size(); ++i) {
|
||||
tensor_info[i + 2] = tensor_list->element_shape()[i];
|
||||
tensor_data[i + 2] = tensor_list->element_shape()[i];
|
||||
}
|
||||
auto status = lite::SetTensorData(tensor_info, tensor_data, tensor_list->element_shape().size() + 2);
|
||||
delete[] tensor_data;
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "set tensor data failed";
|
||||
return nullptr;
|
||||
}
|
||||
para_value_lite->set_tensor_addr(tensor_info);
|
||||
para_value_lite->set_tensor_size(tensor_list->element_shape().size() + 2);
|
||||
}
|
||||
|
||||
new_abstract->set_value(para_value_lite);
|
||||
new_abstract->set_value(tensor_info);
|
||||
return new_abstract;
|
||||
}
|
||||
|
||||
STATUS InferShapePass::SetParameterAbstract(const ParameterPtr ¶meter) {
|
||||
MS_ASSERT(parameter != nullptr);
|
||||
auto old_abstract = parameter->abstract();
|
||||
if (old_abstract == nullptr) {
|
||||
MS_LOG(ERROR) << "Abstract of parameter is nullptr, " << parameter->name();
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (!utils::isa<abstract::AbstractTensorPtr>(old_abstract)) {
|
||||
MS_LOG(ERROR) << "Abstract of parameter should be abstract tensor, " << parameter->name();
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto abstract_tensor = utils::cast<abstract::AbstractTensorPtr>(old_abstract);
|
||||
|
||||
auto typePtr = abstract_tensor->element()->GetTypeTrack();
|
||||
if (typePtr == nullptr) {
|
||||
MS_LOG(ERROR) << "typePtr is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
if (!utils::isa<abstract::ShapePtr>(abstract_tensor->BuildShape())) {
|
||||
MS_LOG(ERROR) << "Shape of Abstract of parameter should be ShapePtr, " << parameter->name();
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto shape_vector = utils::cast<abstract::ShapePtr>(abstract_tensor->BuildShape())->shape();
|
||||
std::vector<int32_t> shape;
|
||||
(void)std::transform(shape_vector.begin(), shape_vector.end(), std::back_inserter(shape),
|
||||
[](const int64_t &value) { return static_cast<int32_t>(value); });
|
||||
|
||||
auto new_abstract = std::make_shared<abstract::AbstractTensor>(typePtr, shape_vector);
|
||||
auto new_value = std::make_shared<ParamValueLite>();
|
||||
new_value->set_tensor_shape(shape); // scalar's shape is {}
|
||||
new_value->set_tensor_type(typePtr->type_id());
|
||||
new_value->set_format(schema::Format_NHWC); // default format is NHWC
|
||||
if (parameter->has_default()) {
|
||||
auto param_value = std::dynamic_pointer_cast<ParamValueLite>(parameter->default_param());
|
||||
new_value->set_format(param_value->format());
|
||||
new_value->set_tensor_size(param_value->tensor_size());
|
||||
|
||||
char *tensor_data = new (std::nothrow) char[new_value->tensor_size()];
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "new char[] failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto ret = memcpy_s(tensor_data, new_value->tensor_size(), param_value->tensor_addr(), param_value->tensor_size());
|
||||
if (new_value->tensor_size() != 0 && ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy error: " << ret;
|
||||
delete[] tensor_data;
|
||||
return RET_ERROR;
|
||||
}
|
||||
new_value->SetTensorData(tensor_data, new_value->tensor_size());
|
||||
}
|
||||
new_abstract->set_value(new_value);
|
||||
parameter->set_abstract(new_abstract);
|
||||
return RET_OK;
|
||||
}
|
||||
|
||||
void InferShapePass::FreeTensors(std::vector<lite::Tensor *> *tensors) {
|
||||
for (auto tensor : *tensors) {
|
||||
delete tensor;
|
||||
|
@ -178,18 +127,18 @@ STATUS InferShapePass::GetCNodeInputTensors(const CNodePtr &cnode, std::vector<l
|
|||
return RET_ERROR;
|
||||
}
|
||||
auto abstract_tensor = utils::cast<abstract::AbstractTensorPtr>(abstract);
|
||||
if (!utils::isa<ParamValueLitePtr>(abstract_tensor->GetValueTrack())) { // input node not complete infershape
|
||||
MS_LOG(DEBUG) << "Value of abstract is not ParamValueLite, indicate that infershape has failed";
|
||||
if (!utils::isa<tensor::TensorPtr>(abstract_tensor->GetValueTrack())) { // input node not complete infershape
|
||||
MS_LOG(DEBUG) << "Value of abstract is not tensor::Tensor, indicate that infershape has failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
auto param_value_lite = utils::cast<ParamValueLitePtr>(abstract_tensor->GetValueTrack());
|
||||
auto param_value_lite = utils::cast<tensor::TensorPtr>(abstract_tensor->GetValueTrack());
|
||||
if (param_value_lite == nullptr) {
|
||||
MS_LOG(ERROR) << "ParamValueLite of abstract is nullptr";
|
||||
MS_LOG(ERROR) << "tensor::Tensor of abstract is nullptr";
|
||||
return RET_ERROR;
|
||||
}
|
||||
|
||||
std::unique_ptr<lite::Tensor> tensor = nullptr;
|
||||
if (param_value_lite->tensor_type() != kObjectTypeTensorType) {
|
||||
if (param_value_lite->data_type() != kObjectTypeTensorType) {
|
||||
tensor = std::make_unique<lite::Tensor>();
|
||||
} else {
|
||||
tensor = std::make_unique<lite::TensorList>();
|
||||
|
@ -198,29 +147,32 @@ STATUS InferShapePass::GetCNodeInputTensors(const CNodePtr &cnode, std::vector<l
|
|||
MS_LOG(ERROR) << "new input tensor failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
if (param_value_lite->tensor_type() != kObjectTypeTensorType) {
|
||||
tensor->set_shape(param_value_lite->tensor_shape());
|
||||
tensor->set_data_type(param_value_lite->tensor_type());
|
||||
tensor->set_format(schema::Format(param_value_lite->format()));
|
||||
|
||||
std::vector<int> shape;
|
||||
std::transform(param_value_lite->shape().begin(), param_value_lite->shape().end(), std::back_inserter(shape),
|
||||
[](const int64_t &value) { return static_cast<int32_t>(value); });
|
||||
if (param_value_lite->data_type() != kObjectTypeTensorType) {
|
||||
tensor->set_shape(shape);
|
||||
tensor->set_data_type(param_value_lite->data_type());
|
||||
}
|
||||
|
||||
if (utils::isa<ParameterPtr>(input)) {
|
||||
auto parameter = input->cast<ParameterPtr>();
|
||||
if (parameter->has_default()) {
|
||||
auto param_value = std::dynamic_pointer_cast<ParamValueLite>(parameter->default_param());
|
||||
if (param_value_lite->tensor_type() != kObjectTypeTensorType) {
|
||||
auto tensor_info = std::dynamic_pointer_cast<tensor::Tensor>(parameter->default_param());
|
||||
if (param_value_lite->data_type() != kObjectTypeTensorType) {
|
||||
auto ret = tensor->MallocData();
|
||||
if (ret != 0) {
|
||||
MS_LOG(ERROR) << "Malloc tensor data failed";
|
||||
return RET_ERROR;
|
||||
}
|
||||
ret = memcpy_s(tensor->MutableData(), tensor->Size(), param_value->tensor_addr(), param_value->tensor_size());
|
||||
ret = memcpy_s(tensor->MutableData(), tensor->Size(), tensor_info->data_c(), tensor_info->Size());
|
||||
if (tensor->Size() != 0 && ret != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy error: " << ret;
|
||||
return RET_ERROR;
|
||||
}
|
||||
} else {
|
||||
int *data = reinterpret_cast<int *>(param_value->tensor_addr());
|
||||
int *data = reinterpret_cast<int *>(tensor_info->data_c());
|
||||
auto tensor_list = reinterpret_cast<lite::TensorList *>(tensor.get());
|
||||
if (tensor_list->Decode(data) != RET_OK) {
|
||||
return RET_ERROR;
|
||||
|
@ -349,10 +301,6 @@ bool InferShapePass::Run(const FuncGraphPtr &func_graph) {
|
|||
auto node_list = TopoSort(func_graph->get_return());
|
||||
for (auto &node : node_list) {
|
||||
if (utils::isa<ParameterPtr>(node)) {
|
||||
int status = SetParameterAbstract(node->cast<ParameterPtr>());
|
||||
if (status != RET_OK) {
|
||||
return false;
|
||||
}
|
||||
continue;
|
||||
}
|
||||
if (!utils::isa<CNodePtr>(node)) {
|
||||
|
|
|
@ -39,7 +39,6 @@ class InferShapePass : public Pass {
|
|||
abstract::AbstractTensorPtr ConvertLiteTensorToAbstractTensor(lite::Tensor *tensor);
|
||||
STATUS GetCNodeInputTensors(const CNodePtr &cnode, std::vector<lite::Tensor *> *input_tensors);
|
||||
STATUS GetCNodeOutputTensors(const CNodePtr &cnode, std::vector<lite::Tensor *> *output_tensors);
|
||||
STATUS SetParameterAbstract(const ParameterPtr ¶meter);
|
||||
STATUS SetCNodeAbstract(const std::vector<lite::Tensor *> &output_tensors, const std::shared_ptr<CNode> &cnode);
|
||||
int StrIsContain(const std::vector<std::string> &total, const std::string &aim);
|
||||
int SetSubGraphInputsAbstract(const CNodePtr &cnode, const FuncGraphPtr &func_graph);
|
||||
|
|
|
@ -21,7 +21,6 @@
|
|||
#include <string>
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "backend/optimizer/common/pass.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "include/errorcode.h"
|
||||
|
||||
using mindspore::lite::STATUS;
|
||||
|
|
|
@ -14,7 +14,6 @@
|
|||
* limitations under the License.
|
||||
*/
|
||||
#include "tools/optimizer/graph/mindir_adjust_pass.h"
|
||||
#include <algorithm>
|
||||
#include <vector>
|
||||
#include <memory>
|
||||
|
||||
|
@ -22,15 +21,14 @@
|
|||
#include "tools/converter/quant_param_holder.h"
|
||||
#include "tools/converter/quantizer/quantize_util.h"
|
||||
#include "src/common/log_adapter.h"
|
||||
#include "src/tensor.h"
|
||||
|
||||
namespace mindspore {
|
||||
namespace opt {
|
||||
namespace {
|
||||
constexpr size_t kDoubleNum = 2;
|
||||
void FillDefaultInputQuantParamIfNeed(const PrimitivePtr &prim, const size_t &input_size) {
|
||||
auto quant_param_valueptr = prim->GetAttr("quant_params");
|
||||
if (quant_param_valueptr == nullptr) {
|
||||
auto quant_tensor_info_ptr = prim->GetAttr("quant_params");
|
||||
if (quant_tensor_info_ptr == nullptr) {
|
||||
prim->AddAttr("quant_params", std::make_shared<lite::QuantParamHolder>());
|
||||
}
|
||||
auto quant_param_holder = prim->GetAttr("quant_params")->cast<lite::QuantParamHolderPtr>();
|
||||
|
@ -63,8 +61,8 @@ void FillDefaultInputQuantParamIfNeed(const PrimitivePtr &prim, const size_t &in
|
|||
}
|
||||
|
||||
int ConvertInputQuantParam(const PrimitivePtr &prim, bool narrow_range, int32_t numbits) {
|
||||
auto quant_param_valueptr = prim->GetAttr("quant_params");
|
||||
if (quant_param_valueptr == nullptr) {
|
||||
auto quant_tensor_info_ptr = prim->GetAttr("quant_params");
|
||||
if (quant_tensor_info_ptr == nullptr) {
|
||||
prim->AddAttr("quant_params", std::make_shared<lite::QuantParamHolder>());
|
||||
}
|
||||
auto quant_param_holder = prim->GetAttr("quant_params")->cast<lite::QuantParamHolderPtr>();
|
||||
|
@ -123,8 +121,8 @@ int ConvertInputQuantParam(const PrimitivePtr &prim, bool narrow_range, int32_t
|
|||
}
|
||||
|
||||
int ConvertOutputQuantParam(const PrimitivePtr &prim, bool narrow_range, int32_t numbits) {
|
||||
auto quant_param_valueptr = prim->GetAttr("quant_params");
|
||||
if (quant_param_valueptr == nullptr) {
|
||||
auto quant_tensor_info_ptr = prim->GetAttr("quant_params");
|
||||
if (quant_tensor_info_ptr == nullptr) {
|
||||
prim->AddAttr("quant_params", std::make_shared<lite::QuantParamHolder>());
|
||||
}
|
||||
auto quant_param_holder = prim->GetAttr("quant_params")->cast<lite::QuantParamHolderPtr>();
|
||||
|
@ -156,8 +154,8 @@ int ConvertOutputQuantParam(const PrimitivePtr &prim, bool narrow_range, int32_t
|
|||
}
|
||||
|
||||
void CheckQuantParams(const PrimitivePtr &prim) {
|
||||
auto quant_param_valueptr = prim->GetAttr("quant_params");
|
||||
if (quant_param_valueptr == nullptr) {
|
||||
auto quant_tensor_info_ptr = prim->GetAttr("quant_params");
|
||||
if (quant_tensor_info_ptr == nullptr) {
|
||||
prim->AddAttr("quant_params", std::make_shared<lite::QuantParamHolder>());
|
||||
}
|
||||
auto quant_param_holder = prim->GetAttr("quant_params")->cast<lite::QuantParamHolderPtr>();
|
||||
|
@ -263,61 +261,6 @@ int MindirAdjustPass::ValueNodeInt64Convert(AnfNodePtr anf_node) {
|
|||
return lite::RET_NO_CHANGE;
|
||||
}
|
||||
|
||||
int MindirAdjustPass::ParameterNodeConvert(AnfNodePtr anf_node) {
|
||||
if (!utils::isa<ParameterPtr>(anf_node)) {
|
||||
MS_LOG(INFO) << "only parameter node need to convert tensor.";
|
||||
return lite::RET_NO_CHANGE;
|
||||
}
|
||||
auto param_node = anf_node->cast<ParameterPtr>();
|
||||
if (!param_node->has_default()) {
|
||||
MS_LOG(INFO) << "this is graph input, don't need to convert.";
|
||||
return lite::RET_NO_CHANGE;
|
||||
}
|
||||
if (utils::isa<ParamValueLitePtr>(param_node->default_param())) {
|
||||
MS_LOG(INFO) << "the tensor has been a paramvalueLite.";
|
||||
return lite::RET_NO_CHANGE;
|
||||
}
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
if (param_value == nullptr) {
|
||||
MS_LOG(ERROR) << "fail to new a ParamValueLite.";
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
param_node->set_name(param_node->debug_info()->name());
|
||||
auto tensor_info = param_node->default_param()->cast<tensor::TensorPtr>();
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "the node is not a tensor::TensorPtr.";
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
param_value->set_tensor_size(tensor_info->Size());
|
||||
param_value->set_tensor_type(tensor_info->data_type());
|
||||
auto tensor_shape = tensor_info->shape();
|
||||
std::vector<int> shape;
|
||||
std::transform(tensor_shape.begin(), tensor_shape.end(), std::back_inserter(shape),
|
||||
[](int64_t value) { return static_cast<int>(value); });
|
||||
param_value->set_tensor_shape(shape);
|
||||
auto *tensor = new (std::nothrow) lite::Tensor(tensor_info->data_type(), shape);
|
||||
if (tensor == nullptr) {
|
||||
MS_LOG(ERROR) << "new a lite::tensor failed, get a nullptr.";
|
||||
return lite::RET_MEMORY_FAILED;
|
||||
}
|
||||
auto *tensor_data_buf = tensor->MutableData();
|
||||
if (tensor_data_buf == nullptr) {
|
||||
MS_LOG(ERROR) << "malloc tensor data failed.";
|
||||
delete tensor;
|
||||
return lite::RET_MEMORY_FAILED;
|
||||
}
|
||||
if (memcpy_s(tensor_data_buf, tensor_info->Size(), tensor_info->data_c(), tensor_info->Size()) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy_s error.";
|
||||
delete tensor;
|
||||
return lite::RET_MEMORY_FAILED;
|
||||
}
|
||||
tensor->set_data(nullptr);
|
||||
param_value->set_tensor_addr(tensor_data_buf);
|
||||
param_node->set_default_param(param_value);
|
||||
delete tensor;
|
||||
return lite::RET_OK;
|
||||
}
|
||||
|
||||
int MindirAdjustPass::ComputeQuantParams(std::shared_ptr<AnfNode> anf_node) {
|
||||
if (!utils::isa<CNodePtr>(anf_node)) {
|
||||
MS_LOG(INFO) << "only cnode need to convert primitive.";
|
||||
|
@ -357,9 +300,7 @@ bool MindirAdjustPass::Run(const FuncGraphPtr &graph) {
|
|||
int status = lite::RET_OK;
|
||||
bool success_flag = true;
|
||||
for (auto &node : node_list) {
|
||||
if (utils::isa<ParameterPtr>(node)) {
|
||||
status = ParameterNodeConvert(node);
|
||||
} else if (utils::isa<CNodePtr>(node)) {
|
||||
if (utils::isa<CNodePtr>(node)) {
|
||||
status = ComputeQuantParams(node);
|
||||
} else if (utils::isa<ValueNodePtr>(node)) {
|
||||
status = ValueNodeInt64Convert(node);
|
||||
|
|
|
@ -21,7 +21,6 @@
|
|||
#include "backend/optimizer/common/pass.h"
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
#include "src/param_value_lite.h"
|
||||
|
||||
using mindspore::lite::converter::FmkType;
|
||||
using mindspore::schema::QuantType;
|
||||
|
@ -34,7 +33,6 @@ class MindirAdjustPass : public Pass {
|
|||
void SetFmkType(FmkType fmk_type) { fmk_type_ = fmk_type; }
|
||||
int ValueNodeInt64Convert(AnfNodePtr anf_node);
|
||||
void SetTrainFlag(bool train_flag) { train_flag_ = train_flag; }
|
||||
int ParameterNodeConvert(AnfNodePtr anf_node);
|
||||
int ComputeQuantParams(AnfNodePtr anf_node);
|
||||
bool Run(const FuncGraphPtr &graph) override;
|
||||
|
||||
|
|
|
@ -14,13 +14,11 @@
|
|||
* limitations under the License.
|
||||
*/
|
||||
#include "tools/optimizer/graph/onnx_inputs_adjust_pass.h"
|
||||
#include <algorithm>
|
||||
#include <vector>
|
||||
#include <string>
|
||||
#include <functional>
|
||||
#include <memory>
|
||||
#include "ops/fusion/conv2d_fusion.h"
|
||||
#include "ops/fusion/conv2d_transpose_fusion.h"
|
||||
#include "ops/resize.h"
|
||||
#include "include/errorcode.h"
|
||||
|
||||
|
@ -89,12 +87,12 @@ STATUS OnnxInputAdjustOpPass::ReplaceInt64ParameterNode(const FuncGraphPtr &func
|
|||
MS_LOG(ERROR) << "default data is nullptr.";
|
||||
return lite::RET_NULL_PTR;
|
||||
}
|
||||
auto param_value = default_value->cast<ParamValueLitePtr>();
|
||||
if (param_value == nullptr) {
|
||||
MS_LOG(ERROR) << "default data is not paramvaluelite.";
|
||||
auto tensor_info = default_value->cast<tensor::TensorPtr>();
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "default data is not tensor::Tensor.";
|
||||
return lite::RET_NULL_PTR;
|
||||
}
|
||||
auto param_node_new = BuildParameterNode(func_graph, param_node, param_value);
|
||||
auto param_node_new = BuildParameterNode(func_graph, param_node, tensor_info);
|
||||
manager->Replace(param_node, param_node_new);
|
||||
} else {
|
||||
// set graph input
|
||||
|
@ -151,17 +149,17 @@ STATUS OnnxInputAdjustOpPass::ReplaceConstant(const FuncGraphPtr &func_graph, co
|
|||
MS_LOG(ERROR) << "value is not primitive_c.";
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
auto param_value = primitive_c->GetAttr("const_data");
|
||||
if (param_value == nullptr) {
|
||||
auto tensor_info = primitive_c->GetAttr("const_data");
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "constant cnode has no data.";
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
auto param_value_lite = param_value->cast<ParamValueLitePtr>();
|
||||
if (param_value_lite == nullptr) {
|
||||
MS_LOG(ERROR) << "valueptr is not paramvalueliteptr.";
|
||||
auto tensor_info_ptr = tensor_info->cast<tensor::TensorPtr>();
|
||||
if (tensor_info_ptr == nullptr) {
|
||||
MS_LOG(ERROR) << "valueptr is not tensor::Tensorptr.";
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
auto param_node = BuildParameterNode(func_graph, cnode, param_value_lite);
|
||||
auto param_node = BuildParameterNode(func_graph, cnode, tensor_info_ptr);
|
||||
if (param_node == nullptr) {
|
||||
MS_LOG(ERROR) << "convert constant to param node failed.";
|
||||
return lite::RET_ERROR;
|
||||
|
@ -199,17 +197,17 @@ STATUS OnnxInputAdjustOpPass::ReplaceTransposeWithGraphInput(const FuncGraphPtr
|
|||
auto perm_anf = cnode->input(2);
|
||||
auto perm_param = perm_anf->cast<ParameterPtr>();
|
||||
if (perm_param == nullptr || !perm_param->has_default() ||
|
||||
!utils::isa<ParamValueLitePtr>(perm_param->default_param())) {
|
||||
!utils::isa<tensor::TensorPtr>(perm_param->default_param())) {
|
||||
MS_LOG(DEBUG) << "transpose second input is not parameter node.";
|
||||
return lite::RET_OK;
|
||||
}
|
||||
auto perm_value = perm_param->default_param()->cast<ParamValueLitePtr>();
|
||||
if (perm_value->tensor_shape().empty()) {
|
||||
auto perm_value = perm_param->default_param()->cast<tensor::TensorPtr>();
|
||||
if (perm_value->shape().empty()) {
|
||||
MS_LOG(ERROR) << "transpose second input is invalid.";
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
std::vector<int> perm(perm_value->tensor_shape()[0]);
|
||||
if (memcpy_s(perm.data(), perm_value->tensor_size(), perm_value->tensor_addr(), perm_value->tensor_size()) != EOK) {
|
||||
std::vector<int> perm(perm_value->shape()[0]);
|
||||
if (memcpy_s(perm.data(), perm_value->Size(), perm_value->data_c(), perm_value->Size()) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy data failed.";
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
|
@ -252,12 +250,12 @@ STATUS OnnxInputAdjustOpPass::AdjustStridedSlice(const FuncGraphPtr &func_graph,
|
|||
if (param_node == nullptr || !param_node->has_default()) {
|
||||
continue;
|
||||
}
|
||||
const auto &default_data = param_node->default_param()->cast<ParamValueLitePtr>();
|
||||
const auto &default_data = param_node->default_param()->cast<tensor::TensorPtr>();
|
||||
if (default_data == nullptr) {
|
||||
MS_LOG(ERROR) << "this input is not a paramValueLite.";
|
||||
MS_LOG(ERROR) << "this input is not a tensor::Tensor";
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
auto shape = default_data->tensor_shape();
|
||||
auto shape = default_data->shape();
|
||||
size = std::accumulate(shape.begin(), shape.end(), 1, std::multiplies<int>());
|
||||
break;
|
||||
}
|
||||
|
|
|
@ -21,7 +21,7 @@
|
|||
#include "ops/reshape.h"
|
||||
#include "ops/transpose.h"
|
||||
#include "ops/primitive_c.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/common/tensor_util.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
|
||||
namespace mindspore::opt {
|
||||
|
@ -32,35 +32,22 @@ ParameterPtr OnnxPadAdjustPass::CreateNewParameter(const FuncGraphPtr &func_grap
|
|||
MS_ASSERT(func_graph != nullptr);
|
||||
MS_ASSERT(data != nullptr);
|
||||
auto parameter = func_graph->add_parameter();
|
||||
std::vector<int> shape;
|
||||
shape.push_back(static_cast<int>(data.size()));
|
||||
std::vector<int64_t> shape_vector;
|
||||
(void)std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
auto type_id = static_cast<TypeId>(kNumberTypeInt32);
|
||||
auto type_ptr = TypeIdToType(type_id);
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape_vector);
|
||||
parameter->set_abstract(abstract_tensor);
|
||||
|
||||
ParamValueLitePtr param_value = std::make_shared<ParamValueLite>();
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
param_value->set_tensor_shape(shape);
|
||||
param_value->set_tensor_type(type_id);
|
||||
param_value->set_format(schema::Format_NCHW);
|
||||
|
||||
ShapeVector shape_vector;
|
||||
shape_vector.push_back(static_cast<int64_t>(data.size()));
|
||||
size_t size = data.size() * sizeof(int);
|
||||
auto tensor_data = new (std::nothrow) uint8_t[size];
|
||||
if (tensor_data == nullptr) {
|
||||
MS_LOG(ERROR) << "tensor_data is nullptr";
|
||||
|
||||
auto tensor_info = lite::CreateTensorInfo(data.data(), size, shape_vector, kNumberTypeInt32);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "create tensor info failed.";
|
||||
return nullptr;
|
||||
}
|
||||
auto ret = memcpy_s(tensor_data, size, data.data(), size);
|
||||
if (ret != 0) {
|
||||
MS_LOG(ERROR) << "set tensor data failed.";
|
||||
|
||||
auto status = lite::InitParameterFromTensorInfo(parameter, tensor_info);
|
||||
if (status != RET_OK) {
|
||||
MS_LOG(ERROR) << "init parameter from tensor info failed";
|
||||
return nullptr;
|
||||
}
|
||||
param_value->SetTensorData(tensor_data, size);
|
||||
parameter->set_default_param(param_value);
|
||||
|
||||
return parameter;
|
||||
}
|
||||
|
||||
|
|
|
@ -44,17 +44,16 @@ std::vector<int> GetSliceBeginAndSize(const CNodePtr &cnode, const int index) {
|
|||
if (node == nullptr) {
|
||||
return content;
|
||||
}
|
||||
auto paramter_node = node->cast<ParameterPtr>();
|
||||
if (paramter_node == nullptr || !paramter_node->has_default() || paramter_node->default_param() == nullptr) {
|
||||
auto param_node = node->cast<ParameterPtr>();
|
||||
if (param_node == nullptr || !param_node->has_default() || param_node->default_param() == nullptr) {
|
||||
return content;
|
||||
}
|
||||
auto paramter_value = paramter_node->default_param()->cast<ParamValueLitePtr>();
|
||||
if (paramter_value == nullptr) {
|
||||
auto tensor_info = param_node->default_param()->cast<tensor::TensorPtr>();
|
||||
if (tensor_info == nullptr) {
|
||||
return content;
|
||||
}
|
||||
content.resize(paramter_value->tensor_shape_size());
|
||||
if (memcpy_s(content.data(), paramter_value->tensor_shape_size(), paramter_value->tensor_addr(),
|
||||
paramter_value->tensor_shape_size()) != EOK) {
|
||||
content.resize(tensor_info->DataSize());
|
||||
if (memcpy_s(content.data(), tensor_info->Size(), tensor_info->data_c(), tensor_info->Size()) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy data failed.";
|
||||
return {};
|
||||
}
|
||||
|
@ -91,12 +90,12 @@ std::vector<int64_t> GetDefaultParamShape(const ParameterPtr ¶m) {
|
|||
MS_LOG(ERROR) << "default_param is nullptr";
|
||||
return shape_vector;
|
||||
}
|
||||
if (!utils::isa<ParamValueLitePtr>(default_param)) {
|
||||
MS_LOG(ERROR) << "default_param is not ParamValueLite";
|
||||
if (!utils::isa<tensor::TensorPtr>(default_param)) {
|
||||
MS_LOG(ERROR) << "default_param is not tensor::Tensor";
|
||||
return shape_vector;
|
||||
}
|
||||
auto param_value_lite = utils::cast<ParamValueLitePtr>(default_param);
|
||||
auto shape = param_value_lite->tensor_shape();
|
||||
auto param_value_lite = utils::cast<tensor::TensorPtr>(default_param);
|
||||
auto shape = param_value_lite->shape();
|
||||
std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int val) { return static_cast<int64_t>(val); });
|
||||
return shape_vector;
|
||||
|
@ -104,8 +103,8 @@ std::vector<int64_t> GetDefaultParamShape(const ParameterPtr ¶m) {
|
|||
|
||||
bool IsScalarNode(const AnfNodePtr &nodePtr) {
|
||||
if (utils::isa<ParameterPtr>(nodePtr) && nodePtr->cast<ParameterPtr>()->has_default()) {
|
||||
auto tensor = utils::cast<ParamValueLitePtr>(utils::cast<ParameterPtr>(nodePtr)->default_param());
|
||||
auto shape = tensor->tensor_shape();
|
||||
auto tensor = utils::cast<tensor::TensorPtr>(utils::cast<ParameterPtr>(nodePtr)->default_param());
|
||||
auto shape = tensor->shape();
|
||||
if (shape.empty() || (shape.size() == 1 && shape[0] == 1)) {
|
||||
return true;
|
||||
}
|
||||
|
@ -158,12 +157,12 @@ std::vector<int> GetTransposePerm(const CNodePtr &node) {
|
|||
if (!perm_param->has_default() || perm_param->default_param() == nullptr) {
|
||||
return perm;
|
||||
}
|
||||
auto perm_value = perm_param->default_param()->cast<ParamValueLitePtr>();
|
||||
auto perm_value = perm_param->default_param()->cast<tensor::TensorPtr>();
|
||||
if (perm_value == nullptr) {
|
||||
return perm;
|
||||
}
|
||||
perm.resize(perm_value->tensor_shape()[0]);
|
||||
if (memcpy_s(perm.data(), perm_value->tensor_size(), perm_value->tensor_addr(), perm_value->tensor_size()) != EOK) {
|
||||
perm.resize(perm_value->shape()[0]);
|
||||
if (memcpy_s(perm.data(), perm_value->Size(), perm_value->data_c(), perm_value->Size()) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy failed.";
|
||||
return {};
|
||||
}
|
||||
|
|
|
@ -106,12 +106,12 @@ STATUS TfliteInputsAdjustPass::ReplaceInt64ParameterNode(const FuncGraphPtr &fun
|
|||
MS_LOG(ERROR) << "default data is nullptr.";
|
||||
return lite::RET_NULL_PTR;
|
||||
}
|
||||
auto param_value = default_value->cast<ParamValueLitePtr>();
|
||||
if (param_value == nullptr) {
|
||||
MS_LOG(ERROR) << "default data is not paramvaluelite.";
|
||||
auto tensor_info = default_value->cast<tensor::TensorPtr>();
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "default data is not tensor::Tensor.";
|
||||
return lite::RET_NULL_PTR;
|
||||
}
|
||||
auto param_node_new = BuildParameterNode(func_graph, param_node, param_value);
|
||||
auto param_node_new = BuildParameterNode(func_graph, param_node, tensor_info);
|
||||
manager->Replace(param_node, param_node_new);
|
||||
} else {
|
||||
// set graph input
|
||||
|
|
|
@ -19,7 +19,6 @@
|
|||
#include <string>
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "backend/optimizer/common/pass.h"
|
||||
#include "src/param_value_lite.h"
|
||||
#include "tools/optimizer/common/gllo_utils.h"
|
||||
|
||||
namespace mindspore::opt {
|
||||
|
|
|
@ -44,12 +44,12 @@ std::vector<int> GetTransposePerm(const CNodePtr &node) {
|
|||
if (!perm_param->has_default() || perm_param->default_param() == nullptr) {
|
||||
return perm;
|
||||
}
|
||||
auto perm_value = perm_param->default_param()->cast<ParamValueLitePtr>();
|
||||
auto perm_value = perm_param->default_param()->cast<tensor::TensorPtr>();
|
||||
if (perm_value == nullptr) {
|
||||
return perm;
|
||||
}
|
||||
perm.resize(perm_value->tensor_shape()[0]);
|
||||
if (memcpy_s(perm.data(), perm_value->tensor_size(), perm_value->tensor_addr(), perm_value->tensor_size()) != EOK) {
|
||||
perm.resize(perm_value->shape()[0]);
|
||||
if (memcpy_s(perm.data(), perm_value->Size(), perm_value->data_c(), perm_value->Size()) != EOK) {
|
||||
MS_LOG(ERROR) << "memcpy failed.";
|
||||
return {};
|
||||
}
|
||||
|
|
|
@ -52,8 +52,8 @@ lite::STATUS UpdateConv2DParamPass::UpdateCommonConv2D(const CNodePtr &cnode) {
|
|||
return lite::RET_NO_CHANGE;
|
||||
}
|
||||
auto default_param = weight_param->default_param();
|
||||
auto weight_tensor = std::dynamic_pointer_cast<ParamValueLite>(default_param);
|
||||
auto weight_shape = weight_tensor->tensor_shape();
|
||||
auto weight_tensor = std::dynamic_pointer_cast<tensor::Tensor>(default_param);
|
||||
auto weight_shape = weight_tensor->shape();
|
||||
std::vector<int64_t> kernel_size = {weight_shape[0], weight_shape[1]};
|
||||
conv->set_kernel_size(kernel_size);
|
||||
conv->set_in_channel(weight_shape[2]);
|
||||
|
@ -75,8 +75,8 @@ lite::STATUS UpdateConv2DParamPass::UpdateDepthWiseConv2D(const CNodePtr &cnode)
|
|||
if (input_node->isa<Parameter>()) {
|
||||
auto param_node = input_node->cast<ParameterPtr>();
|
||||
auto param = param_node->default_param();
|
||||
auto weight = std::dynamic_pointer_cast<ParamValueLite>(param);
|
||||
conv->set_in_channel(static_cast<int64_t>(weight->tensor_shape().at(0)));
|
||||
auto weight = std::dynamic_pointer_cast<tensor::Tensor>(param);
|
||||
conv->set_in_channel(static_cast<int64_t>(weight->shape().at(0)));
|
||||
}
|
||||
}
|
||||
return lite::RET_OK;
|
||||
|
|
|
@ -36,14 +36,19 @@ const PrimitivePtr kPrimConv2DBackpropInputFusion = std::make_shared<Primitive>(
|
|||
void WeightFormatHardCodePass::SetQuantType(QuantType type) { this->quant_type = type; }
|
||||
void WeightFormatHardCodePass::SetFmkType(FmkType type) { this->fmk_type = type; }
|
||||
lite::STATUS WeightFormatHardCodePass::HardCodeCAFFE(const CNodePtr &conv_node,
|
||||
const ParamValueLitePtr ¶m_value) const {
|
||||
const tensor::TensorPtr &tensor_info) const {
|
||||
MS_ASSERT(conv_cnode != nullptr);
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
MS_ASSERT(tensor_info != nullptr);
|
||||
auto prim = GetValueNode<PrimitivePtr>(conv_node->input(0));
|
||||
if (prim == nullptr) {
|
||||
MS_LOG(ERROR) << "Invalid anfnode, which don't have primitive.";
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
switch (quant_type) {
|
||||
case schema::QuantType_PostTraining:
|
||||
case QuantType_WeightQuant:
|
||||
case QuantType_QUANT_NONE:
|
||||
param_value->set_format(schema::Format::Format_KCHW);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::KCHW));
|
||||
break;
|
||||
default: {
|
||||
MS_LOG(ERROR) << "Unsupported quantType: " << EnumNameQuantType(quant_type)
|
||||
|
@ -55,9 +60,9 @@ lite::STATUS WeightFormatHardCodePass::HardCodeCAFFE(const CNodePtr &conv_node,
|
|||
}
|
||||
|
||||
lite::STATUS WeightFormatHardCodePass::HardCodeONNX(const CNodePtr &conv_node,
|
||||
const ParamValueLitePtr ¶m_value) const {
|
||||
const tensor::TensorPtr &tensor_info) const {
|
||||
MS_ASSERT(conv_cnode != nullptr);
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
MS_ASSERT(tensor_info != nullptr);
|
||||
auto prim = GetValueNode<PrimitivePtr>(conv_node->input(0));
|
||||
if (prim == nullptr) {
|
||||
MS_LOG(ERROR) << "Invalid anfnode, which don't have primitive.";
|
||||
|
@ -70,12 +75,12 @@ lite::STATUS WeightFormatHardCodePass::HardCodeONNX(const CNodePtr &conv_node,
|
|||
// sum up from current onnx quant models
|
||||
if (CheckPrimitiveType(conv_node, prim::kPrimConv2DFusion)) {
|
||||
if (!is_depth_wise) {
|
||||
param_value->set_format(schema::Format::Format_KHWC);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::KHWC));
|
||||
} else {
|
||||
param_value->set_format(schema::Format::Format_CHWK);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::CHWK));
|
||||
}
|
||||
} else if (CheckPrimitiveType(conv_node, prim::kPrimConv2dTransposeFusion) && !is_depth_wise) {
|
||||
param_value->set_format(schema::Format::Format_KCHW);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::KCHW));
|
||||
} else {
|
||||
MS_LOG(ERROR) << "Unsupported op: " << conv_node->fullname_with_scope();
|
||||
return lite::RET_ERROR;
|
||||
|
@ -91,9 +96,9 @@ lite::STATUS WeightFormatHardCodePass::HardCodeONNX(const CNodePtr &conv_node,
|
|||
if (CheckPrimitiveType(conv_node, prim::kPrimConv2DFusion) ||
|
||||
CheckPrimitiveType(conv_node, prim::kPrimConv2dTransposeFusion)) {
|
||||
if (format == schema::Format::Format_NHWC) {
|
||||
param_value->set_format(schema::Format::Format_KHWC);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::KHWC));
|
||||
} else {
|
||||
param_value->set_format(schema::Format::Format_KCHW);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::KCHW));
|
||||
}
|
||||
}
|
||||
} break;
|
||||
|
@ -107,9 +112,9 @@ lite::STATUS WeightFormatHardCodePass::HardCodeONNX(const CNodePtr &conv_node,
|
|||
}
|
||||
|
||||
lite::STATUS WeightFormatHardCodePass::HardCodeMS(const CNodePtr &conv_node,
|
||||
const ParamValueLitePtr ¶m_value) const {
|
||||
const tensor::TensorPtr &tensor_info) const {
|
||||
MS_ASSERT(conv_cnode != nullptr);
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
MS_ASSERT(tensor_info != nullptr);
|
||||
auto prim = GetValueNode<PrimitivePtr>(conv_node->input(0));
|
||||
if (prim == nullptr) {
|
||||
MS_LOG(ERROR) << "Invalid anfnode, which don't have primitive.";
|
||||
|
@ -122,7 +127,7 @@ lite::STATUS WeightFormatHardCodePass::HardCodeMS(const CNodePtr &conv_node,
|
|||
case QuantType_WeightQuant:
|
||||
case QuantType_QUANT_NONE: {
|
||||
// sum up from current ms quant models
|
||||
param_value->set_format(schema::Format::Format_KCHW);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::KCHW));
|
||||
} break;
|
||||
default: {
|
||||
MS_LOG(ERROR) << "Unsupported quantType: " << EnumNameQuantType(quant_type)
|
||||
|
@ -134,9 +139,9 @@ lite::STATUS WeightFormatHardCodePass::HardCodeMS(const CNodePtr &conv_node,
|
|||
}
|
||||
|
||||
lite::STATUS WeightFormatHardCodePass::HardCodeTFLITE(const CNodePtr &conv_node,
|
||||
const ParamValueLitePtr ¶m_value) const {
|
||||
const tensor::TensorPtr &tensor_info) const {
|
||||
MS_ASSERT(conv_cnode != nullptr);
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
MS_ASSERT(tensor_info != nullptr);
|
||||
auto prim = GetValueNode<PrimitivePtr>(conv_node->input(0));
|
||||
if (prim == nullptr) {
|
||||
MS_LOG(ERROR) << "Invalid anfnode, which don't have primitive.";
|
||||
|
@ -150,12 +155,12 @@ lite::STATUS WeightFormatHardCodePass::HardCodeTFLITE(const CNodePtr &conv_node,
|
|||
case QuantType_QUANT_NONE: {
|
||||
if (CheckPrimitiveType(conv_node, prim::kPrimConv2DFusion)) {
|
||||
if (!is_depth_wise) {
|
||||
param_value->set_format(schema::Format::Format_KHWC);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::KHWC));
|
||||
} else {
|
||||
param_value->set_format(schema::Format::Format_CHWK);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::CHWK));
|
||||
}
|
||||
} else if (CheckPrimitiveType(conv_node, prim::kPrimConv2dTransposeFusion) && !is_depth_wise) {
|
||||
param_value->set_format(schema::Format::Format_CHWK);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::CHWK));
|
||||
}
|
||||
} break;
|
||||
default: {
|
||||
|
@ -167,9 +172,9 @@ lite::STATUS WeightFormatHardCodePass::HardCodeTFLITE(const CNodePtr &conv_node,
|
|||
}
|
||||
|
||||
lite::STATUS WeightFormatHardCodePass::HardCodeTF(const CNodePtr &conv_node,
|
||||
const ParamValueLitePtr ¶m_value) const {
|
||||
const tensor::TensorPtr &tensor_info) const {
|
||||
MS_ASSERT(conv_cnode != nullptr);
|
||||
MS_ASSERT(param_value != nullptr);
|
||||
MS_ASSERT(tensor_info != nullptr);
|
||||
auto prim = GetValueNode<PrimitivePtr>(conv_node->input(0));
|
||||
if (prim == nullptr) {
|
||||
MS_LOG(ERROR) << "Invalid anfnode, which don't have primitive.";
|
||||
|
@ -179,13 +184,13 @@ lite::STATUS WeightFormatHardCodePass::HardCodeTF(const CNodePtr &conv_node,
|
|||
if (CheckPrimitiveType(conv_node, prim::kPrimConv2DFusion)) {
|
||||
{
|
||||
if (!is_depth_wise) {
|
||||
param_value->set_format(schema::Format::Format_HWCK);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::HWCK));
|
||||
} else {
|
||||
param_value->set_format(schema::Format::Format_HWKC);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::HWKC));
|
||||
}
|
||||
}
|
||||
} else if (CheckPrimitiveType(conv_node, prim::kPrimConv2dTransposeFusion) && !is_depth_wise) {
|
||||
param_value->set_format(schema::Format::Format_HWCK);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(Format::HWCK));
|
||||
}
|
||||
return lite::RET_OK;
|
||||
}
|
||||
|
@ -206,27 +211,27 @@ bool WeightFormatHardCodePass::Run(const FuncGraphPtr &graph) {
|
|||
MS_ASSERT(conv_cnode->inputs().size() > kConvWeightIndex);
|
||||
auto weight_node = conv_cnode->input(kConvWeightIndex);
|
||||
MS_ASSERT(weight_node != nullptr);
|
||||
auto param_value = GetLiteParamValue(weight_node);
|
||||
if (param_value == nullptr) {
|
||||
auto tensor_info = GetTensorInfo(weight_node);
|
||||
if (tensor_info == nullptr) {
|
||||
MS_LOG(ERROR) << "weight node must param value";
|
||||
return false;
|
||||
}
|
||||
lite::STATUS status;
|
||||
switch (fmk_type) {
|
||||
case FmkType_CAFFE:
|
||||
status = HardCodeCAFFE(conv_cnode, param_value);
|
||||
status = HardCodeCAFFE(conv_cnode, tensor_info);
|
||||
break;
|
||||
case FmkType_TFLITE:
|
||||
status = HardCodeTFLITE(conv_cnode, param_value);
|
||||
status = HardCodeTFLITE(conv_cnode, tensor_info);
|
||||
break;
|
||||
case FmkType_TF:
|
||||
status = HardCodeTF(conv_cnode, param_value);
|
||||
status = HardCodeTF(conv_cnode, tensor_info);
|
||||
break;
|
||||
case FmkType_ONNX:
|
||||
status = HardCodeONNX(conv_cnode, param_value);
|
||||
status = HardCodeONNX(conv_cnode, tensor_info);
|
||||
break;
|
||||
case FmkType_MS:
|
||||
status = HardCodeMS(conv_cnode, param_value);
|
||||
status = HardCodeMS(conv_cnode, tensor_info);
|
||||
break;
|
||||
default:
|
||||
MS_LOG(ERROR) << "Unsupported fmkType: " << fmk_type << ", node: " << node->fullname_with_scope();
|
||||
|
|
|
@ -20,7 +20,6 @@
|
|||
#include "schema/inner/model_generated.h"
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "backend/optimizer/common/pass.h"
|
||||
#include "src/param_value_lite.h"
|
||||
|
||||
using mindspore::lite::converter::FmkType;
|
||||
using mindspore::schema::QuantType;
|
||||
|
@ -34,11 +33,11 @@ class WeightFormatHardCodePass : public Pass {
|
|||
bool Run(const FuncGraphPtr &graph) override;
|
||||
|
||||
private:
|
||||
lite::STATUS HardCodeCAFFE(const CNodePtr &node, const ParamValueLitePtr ¶m_value) const;
|
||||
lite::STATUS HardCodeONNX(const CNodePtr &node, const ParamValueLitePtr ¶m_value) const;
|
||||
lite::STATUS HardCodeMS(const CNodePtr &node, const ParamValueLitePtr ¶m_value) const;
|
||||
lite::STATUS HardCodeTFLITE(const CNodePtr &node, const ParamValueLitePtr ¶m_value) const;
|
||||
lite::STATUS HardCodeTF(const CNodePtr &conv_node, const ParamValueLitePtr ¶m_value) const;
|
||||
lite::STATUS HardCodeCAFFE(const CNodePtr &node, const tensor::TensorPtr &tensor_info) const;
|
||||
lite::STATUS HardCodeONNX(const CNodePtr &node, const tensor::TensorPtr &tensor_info) const;
|
||||
lite::STATUS HardCodeMS(const CNodePtr &node, const tensor::TensorPtr &tensor_info) const;
|
||||
lite::STATUS HardCodeTFLITE(const CNodePtr &node, const tensor::TensorPtr &tensor_info) const;
|
||||
lite::STATUS HardCodeTF(const CNodePtr &conv_node, const tensor::TensorPtr &tensor_info) const;
|
||||
|
||||
private:
|
||||
QuantType quant_type = schema::QuantType_QUANT_NONE;
|
||||
|
|
|
@ -69,9 +69,7 @@ lite::STATUS WeightFormatTransformPass::TransposeInsertForWeightSharing(const Fu
|
|||
if (!utils::isa<CNode>(node)) {
|
||||
continue;
|
||||
}
|
||||
if (CheckPrimitiveType(node, prim::kPrimConv2DFusion) || CheckPrimitiveType(node, kPrimConv2DBackpropInputFusion) ||
|
||||
CheckPrimitiveType(node, prim::kPrimConv2dTransposeFusion) ||
|
||||
CheckPrimitiveType(node, prim::kPrimApplyMomentum) || CheckPrimitiveType(node, prim::kPrimSGD) ||
|
||||
if (CheckPrimitiveType(node, prim::kPrimApplyMomentum) || CheckPrimitiveType(node, prim::kPrimSGD) ||
|
||||
CheckPrimitiveType(node, prim::kPrimAdam)) {
|
||||
continue;
|
||||
}
|
||||
|
@ -79,6 +77,13 @@ lite::STATUS WeightFormatTransformPass::TransposeInsertForWeightSharing(const Fu
|
|||
auto inputs = cnode->inputs();
|
||||
if (std::any_of(inputs.begin(), inputs.end(),
|
||||
[&weight_node](const AnfNodePtr &anf_node) { return weight_node == anf_node; })) {
|
||||
if (CheckPrimitiveType(node, prim::kPrimConv2DFusion) ||
|
||||
CheckPrimitiveType(node, kPrimConv2DBackpropInputFusion) ||
|
||||
CheckPrimitiveType(node, prim::kPrimConv2dTransposeFusion)) {
|
||||
auto prim = GetValueNode<PrimitivePtr>(cnode->input(0));
|
||||
prim->AddAttr(kWeightFormat, MakeValue<int64_t>(mindspore::KHWC));
|
||||
continue;
|
||||
}
|
||||
adjust_nodes.push_back(cnode);
|
||||
}
|
||||
}
|
||||
|
@ -138,9 +143,14 @@ lite::STATUS WeightFormatTransformPass::ConvWeightFormatTrans(const FuncGraphPtr
|
|||
}
|
||||
auto conv_cnode = node->cast<CNodePtr>();
|
||||
MS_ASSERT(conv_cnode->inputs().size() > kConvWeightIndex);
|
||||
auto prim = GetValueNode<PrimitivePtr>(conv_cnode->input(0));
|
||||
if (prim == nullptr) {
|
||||
MS_LOG(ERROR) << "Invalid anfnode, which don't have primitive.";
|
||||
return lite::RET_ERROR;
|
||||
}
|
||||
auto weight_node = conv_cnode->input(kConvWeightIndex);
|
||||
MS_ASSERT(weight_node != nullptr);
|
||||
auto weight_value = GetLiteParamValue(weight_node);
|
||||
auto weight_value = GetTensorInfo(weight_node);
|
||||
if (weight_value == nullptr) {
|
||||
MS_LOG(ERROR) << "weight node must param value";
|
||||
return false;
|
||||
|
@ -148,31 +158,30 @@ lite::STATUS WeightFormatTransformPass::ConvWeightFormatTrans(const FuncGraphPtr
|
|||
MS_ASSERT(weight_value->tensor_type() == TypeId::kNumberTypeFloat32 ||
|
||||
weight_value->tensor_type() == TypeId::kNumberTypeUInt8);
|
||||
lite::STATUS status;
|
||||
schema::Format src_format = static_cast<schema::Format>(weight_value->format());
|
||||
auto value_ptr = prim->GetAttr(opt::kWeightFormat);
|
||||
auto weight_src_format = static_cast<schema::Format>(GetValue<int64_t>(value_ptr));
|
||||
schema::Format weight_dst_format = schema::Format::Format_KHWC;
|
||||
if (dst_format != schema::Format::Format_NUM_OF_FORMAT) {
|
||||
weight_dst_format = dst_format;
|
||||
}
|
||||
status = TransFilterFormat(weight_value, weight_dst_format);
|
||||
status = TransFilterFormat(weight_value, weight_src_format, weight_dst_format);
|
||||
if (status == RET_OK) {
|
||||
weight_value->set_format(weight_dst_format);
|
||||
prim->AddAttr(opt::kWeightFormat, MakeValue<int64_t>(weight_dst_format));
|
||||
} else {
|
||||
MS_LOG(ERROR) << "TransFilter " << EnumNameFormat(schema::EnumValuesFormat()[weight_value->format()]) << "To"
|
||||
MS_LOG(ERROR) << "TransFilter " << EnumNameFormat(schema::EnumValuesFormat()[weight_dst_format]) << "To"
|
||||
<< EnumNameFormat(weight_dst_format) << " failed, node : " << node->fullname_with_scope()
|
||||
<< "quant type:" << quant_type;
|
||||
return ERROR;
|
||||
}
|
||||
status = HandleWeightSharing(graph, weight_node->cast<ParameterPtr>(), src_format, weight_dst_format);
|
||||
status = HandleWeightSharing(graph, weight_node->cast<ParameterPtr>(), weight_src_format, weight_dst_format);
|
||||
if (status != lite::RET_OK) {
|
||||
MS_LOG(ERROR) << "handle weight-sharing failed.";
|
||||
return false;
|
||||
}
|
||||
auto type_id = static_cast<TypeId>(weight_value->tensor_type());
|
||||
auto type_id = static_cast<TypeId>(weight_value->data_type());
|
||||
auto type_ptr = TypeIdToType(type_id);
|
||||
auto shape = weight_value->tensor_shape();
|
||||
std::vector<int64_t> shape_vector;
|
||||
(void)std::transform(shape.begin(), shape.end(), std::back_inserter(shape_vector),
|
||||
[](const int32_t &value) { return static_cast<int64_t>(value); });
|
||||
auto shape = weight_value->shape();
|
||||
std::vector<int64_t> shape_vector(shape.begin(), shape.end());
|
||||
auto abstract_tensor = std::make_shared<abstract::AbstractTensor>(type_ptr, shape_vector);
|
||||
weight_node->set_abstract(abstract_tensor);
|
||||
}
|
||||
|
|
|
@ -21,7 +21,6 @@
|
|||
#include "schema/inner/model_generated.h"
|
||||
#include "tools/converter/converter_flags.h"
|
||||
#include "backend/optimizer/common/pass.h"
|
||||
#include "src/param_value_lite.h"
|
||||
|
||||
using mindspore::lite::converter::FmkType;
|
||||
namespace mindspore::opt {
|
||||
|
|
Loading…
Reference in New Issue