forked from mindspore-Ecosystem/mindspore
!10922 optimize somas logs
From: @laiyongqiang Reviewed-by: Signed-off-by:
This commit is contained in:
commit
bb2870fe71
|
@ -63,7 +63,7 @@ bool Somas::Allocate(const session::KernelGraph *graph) {
|
|||
MS_LOG(EXCEPTION) << "Somas Assign Failed.";
|
||||
}
|
||||
|
||||
GenStatisticInfo();
|
||||
GenGraphStatisticInfo();
|
||||
return ret;
|
||||
}
|
||||
|
||||
|
@ -87,6 +87,10 @@ bool Somas::InitSomasTensors(const session::KernelGraph *graph) {
|
|||
<< contiguous_tensors_list_.size() << " contiguous lists";
|
||||
|
||||
if (save_graphs_) {
|
||||
std::string file_path =
|
||||
save_graphs_path_ + "/" + "somas_pre_processed_info_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
DumpSomasInfoIR(file_path);
|
||||
|
||||
std::string offline_file_path =
|
||||
save_graphs_path_ + "/" + "somas_offline_log_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
DumpOfflineIR(offline_file_path);
|
||||
|
@ -182,6 +186,14 @@ void Somas::InitSomasInputTensors(const session::KernelGraph *graph) {
|
|||
bool is_all_nop_node = opt::IsAllNopNode(graph);
|
||||
auto kernel_cnodes = graph->execution_order();
|
||||
for (const auto &kernel : kernel_cnodes) {
|
||||
if (AnfAlgo::GetCNodeName(kernel) != kAtomicAddrCleanOpName) {
|
||||
InitCommonNodeInputs(is_all_nop_node, kernel);
|
||||
} else {
|
||||
InitAtomicCleanInputs(is_all_nop_node, kernel);
|
||||
}
|
||||
}
|
||||
}
|
||||
void Somas::InitCommonNodeInputs(bool is_all_nop_node, const CNodePtr &kernel) {
|
||||
auto node = nodes_map_[kernel.get()];
|
||||
MS_EXCEPTION_IF_NULL(node);
|
||||
auto stream = node->GetStream();
|
||||
|
@ -202,6 +214,8 @@ void Somas::InitSomasInputTensors(const session::KernelGraph *graph) {
|
|||
}
|
||||
|
||||
if (!AnfAlgo::IsRealCNodeKernel(prenode_index.first)) {
|
||||
auto parameter = GetSomasParameters(prenode_index.first, prenode_index.second);
|
||||
node->input_parameters_map_[i] = parameter;
|
||||
MS_LOG(DEBUG) << "Input [" << prenode_index.first->fullname_with_scope() << "] is not a real cnode kernel.";
|
||||
continue;
|
||||
}
|
||||
|
@ -239,6 +253,100 @@ void Somas::InitSomasInputTensors(const session::KernelGraph *graph) {
|
|||
}
|
||||
}
|
||||
}
|
||||
|
||||
void Somas::InitAtomicCleanInputs(bool is_all_nop_node, const CNodePtr &kernel) {
|
||||
auto node = nodes_map_[kernel.get()];
|
||||
MS_EXCEPTION_IF_NULL(node);
|
||||
auto stream = node->GetStream();
|
||||
MS_EXCEPTION_IF_NULL(stream);
|
||||
|
||||
MS_EXCEPTION_IF_NULL(kernel->inputs()[1]);
|
||||
auto pre_node = (kernel->inputs()[1])->cast<CNodePtr>();
|
||||
auto iter = nodes_map_.find(pre_node.get());
|
||||
if (iter == nodes_map_.end()) {
|
||||
MS_LOG(EXCEPTION) << "Kernel[" << kernel->fullname_with_scope() << "]'s input [" << pre_node->fullname_with_scope()
|
||||
<< "] is not init.";
|
||||
}
|
||||
auto pre_somas_node = iter->second;
|
||||
// set clean output tensors
|
||||
if (AnfAlgo::HasNodeAttr(kAttrAtomicOutputIndexs, pre_node)) {
|
||||
auto clean_output_indexs = AnfAlgo::GetNodeAttr<std::vector<size_t>>(pre_node, kAttrAtomicOutputIndexs);
|
||||
for (auto index : clean_output_indexs) {
|
||||
if (index > pre_somas_node->output_tensors_.size()) {
|
||||
MS_LOG(EXCEPTION) << "Output index " << index << " exceed input node [" << pre_node->fullname_with_scope()
|
||||
<< "]'s outputs size " << pre_somas_node->output_tensors_.size();
|
||||
}
|
||||
auto input_somas_tensor = pre_somas_node->output_tensors_[index];
|
||||
MS_EXCEPTION_IF_NULL(input_somas_tensor);
|
||||
node->input_tensors_.push_back(input_somas_tensor);
|
||||
input_somas_tensor->destinations_.insert(node);
|
||||
input_somas_tensor->destinationStreams_.insert(stream);
|
||||
if (input_somas_tensor->lifetime_.start_ > node->GetId()) {
|
||||
input_somas_tensor->lifetime_.start_ = node->GetId();
|
||||
}
|
||||
node->ancestor_nodes_.insert(pre_somas_node);
|
||||
auto input_tensor_stream = input_somas_tensor->GetSourceStream();
|
||||
if (input_tensor_stream != stream) {
|
||||
stream->ancestor_streams_.insert(input_tensor_stream);
|
||||
input_somas_tensor->between_streams_ = true;
|
||||
}
|
||||
}
|
||||
}
|
||||
// set clean workspace tensors
|
||||
if (AnfAlgo::HasNodeAttr(kAttrAtomicWorkspaceIndexs, pre_node)) {
|
||||
auto clean_workspace_indexs = AnfAlgo::GetNodeAttr<std::vector<size_t>>(pre_node, kAttrAtomicWorkspaceIndexs);
|
||||
for (const auto &index : clean_workspace_indexs) {
|
||||
if (index > pre_somas_node->output_tensors_.size()) {
|
||||
MS_LOG(EXCEPTION) << "Workspace index " << index << " exceed input node [" << pre_node->fullname_with_scope()
|
||||
<< "]'s Workspace size " << pre_somas_node->workspace_tensors_.size();
|
||||
}
|
||||
auto input_somas_tensor = pre_somas_node->workspace_tensors_[index];
|
||||
MS_EXCEPTION_IF_NULL(input_somas_tensor);
|
||||
node->input_tensors_.push_back(input_somas_tensor);
|
||||
input_somas_tensor->destinations_.insert(node);
|
||||
input_somas_tensor->destinationStreams_.insert(stream);
|
||||
if (input_somas_tensor->lifetime_.start_ > node->GetId()) {
|
||||
input_somas_tensor->lifetime_.start_ = node->GetId();
|
||||
}
|
||||
node->ancestor_nodes_.insert(pre_somas_node);
|
||||
auto input_tensor_stream = input_somas_tensor->GetSourceStream();
|
||||
if (input_tensor_stream != stream) {
|
||||
stream->ancestor_streams_.insert(input_tensor_stream);
|
||||
input_somas_tensor->between_streams_ = true;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
SomasParameterPtr Somas::CreateSomasParameters(AnfNodePtr node, size_t index) {
|
||||
auto id = parameters_list_.size();
|
||||
auto device_addr = AnfAlgo::GetOutputAddr(node, index);
|
||||
if (device_addr == nullptr) {
|
||||
MS_LOG(EXCEPTION) << "Node " << node->fullname_with_scope() << " has no device address before Somas.";
|
||||
}
|
||||
auto param = std::make_shared<SomasParameter>(id, node, index, device_addr->GetPtr(), device_addr->GetSize());
|
||||
parameters_list_.push_back(param);
|
||||
return param;
|
||||
}
|
||||
|
||||
SomasParameterPtr Somas::GetSomasParameters(AnfNodePtr node, size_t index) {
|
||||
auto key = node.get();
|
||||
auto iter = parameters_map_.find(key);
|
||||
if (iter != parameters_map_.end()) {
|
||||
auto it = std::find_if(iter->second.begin(), iter->second.end(),
|
||||
[index](SomasParameterPtr param) -> bool { return index == param->output_index_; });
|
||||
if (it != iter->second.end()) {
|
||||
return *it;
|
||||
} else {
|
||||
auto new_param = CreateSomasParameters(node, index);
|
||||
iter->second.push_back(new_param);
|
||||
return new_param;
|
||||
}
|
||||
} else {
|
||||
auto new_param = CreateSomasParameters(node, index);
|
||||
parameters_map_[key].push_back(new_param);
|
||||
return new_param;
|
||||
}
|
||||
}
|
||||
|
||||
void Somas::InitBasicInfo(const session::KernelGraph *graph) {
|
||||
|
@ -258,8 +366,8 @@ void Somas::InitBasicInfo(const session::KernelGraph *graph) {
|
|||
save_graphs_path_ = ".";
|
||||
}
|
||||
if (save_graphs_) {
|
||||
std::string file_path = save_graphs_path_ + "/" + "somas_basic_info_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
DumpSomasBasicIR(file_path);
|
||||
std::string file_path = save_graphs_path_ + "/" + "somas_initial_info_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
DumpSomasInfoIR(file_path);
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -281,7 +389,6 @@ void Somas::GetNextOutputProcess(const session::KernelGraph *graph) {
|
|||
}
|
||||
}
|
||||
}
|
||||
|
||||
MS_LOG(INFO) << "Special Tensor total size: GetNext Output " << total_size;
|
||||
}
|
||||
|
||||
|
@ -305,12 +412,6 @@ void Somas::IndependentNodeOutputProcess(const session::KernelGraph *graph) {
|
|||
}
|
||||
|
||||
MS_LOG(INFO) << "Special Tensor total size: Independent Node output " << total_size;
|
||||
|
||||
if (save_graphs_ && total_size) {
|
||||
std::string file_path =
|
||||
save_graphs_path_ + "/" + "Independent_node_process_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
DumpSomasBasicIR(file_path);
|
||||
}
|
||||
}
|
||||
|
||||
void Somas::SummaryInputProcess(const session::KernelGraph *graph) {
|
||||
|
@ -349,12 +450,6 @@ void Somas::SummaryInputProcess(const session::KernelGraph *graph) {
|
|||
}
|
||||
|
||||
MS_LOG(INFO) << "Special Tensor total size: SummaryNodes: " << total_summary_size;
|
||||
|
||||
if (save_graphs_) {
|
||||
std::string file_path =
|
||||
save_graphs_path_ + "/" + "somas_summary_process_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
DumpSomasBasicIR(file_path);
|
||||
}
|
||||
}
|
||||
|
||||
void Somas::RefNodeProcess(const session::KernelGraph *graph) {
|
||||
|
@ -400,12 +495,6 @@ void Somas::RefNodeProcess(const session::KernelGraph *graph) {
|
|||
}
|
||||
|
||||
MS_LOG(INFO) << "Special Tensor total size: RefNode: input " << total_input_size << " output " << total_output_size;
|
||||
|
||||
if (save_graphs_ && (total_input_size || total_output_size)) {
|
||||
std::string file_path =
|
||||
save_graphs_path_ + "/" + "somas_refnode_process_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
DumpSomasBasicIR(file_path);
|
||||
}
|
||||
}
|
||||
|
||||
void Somas::UnReuseNodeProcess(const session::KernelGraph *graph) {
|
||||
|
@ -443,12 +532,6 @@ void Somas::UnReuseNodeProcess(const session::KernelGraph *graph) {
|
|||
}
|
||||
}
|
||||
}
|
||||
|
||||
if (save_graphs_) {
|
||||
std::string file_path =
|
||||
save_graphs_path_ + "/" + "somas_unreuse_node_process_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
DumpSomasBasicIR(file_path);
|
||||
}
|
||||
}
|
||||
|
||||
void Somas::GenContiguousList(const session::KernelGraph *graph) {
|
||||
|
@ -876,7 +959,7 @@ bool Somas::Assign(const session::KernelGraph *graph) {
|
|||
contiguous_tensors_list_removed_ref, false);
|
||||
MS_LOG(INFO) << "End Solving";
|
||||
if (status != SUCCESS) {
|
||||
GenStatisticInfo();
|
||||
GenGraphStatisticInfo();
|
||||
MS_LOG(EXCEPTION) << "SOMAS Solving Failed.";
|
||||
}
|
||||
|
||||
|
@ -912,11 +995,6 @@ bool Somas::Assign(const session::KernelGraph *graph) {
|
|||
// Set mem_offset_ value by solver result
|
||||
mem_offset_ = static_cast<size_t>(somas_solver_->GetMaxOffset());
|
||||
|
||||
if (save_graphs_) {
|
||||
std::string mem_pool_file_path =
|
||||
save_graphs_path_ + "/" + "somas_mem_pool_info_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
DumpSomasMemoryPoolInfoIR(mem_pool_file_path);
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
|
@ -933,7 +1011,7 @@ std::string Somas::GetSplitName(const std::string &scope_name) const {
|
|||
}
|
||||
}
|
||||
|
||||
void Somas::DumpSomasBasicIR(const string filename) {
|
||||
void Somas::DumpSomasInfoIR(const string filename) {
|
||||
if (filename.size() > PATH_MAX) {
|
||||
MS_LOG(ERROR) << "File path " << filename << " is too long.";
|
||||
return;
|
||||
|
@ -951,16 +1029,38 @@ void Somas::DumpSomasBasicIR(const string filename) {
|
|||
MS_LOG(ERROR) << "Open dump file '" << real_path.value() << "' failed!";
|
||||
return;
|
||||
}
|
||||
ofs << "All Tensors:\n\n";
|
||||
|
||||
ofs << "All Parameters:\n\n";
|
||||
ofs << "index:"
|
||||
<< "\tsize:"
|
||||
<< "\tstart_addr:"
|
||||
<< "\tsource node name:"
|
||||
<< "\tnode out index:\n";
|
||||
|
||||
for (const auto ¶m : parameters_list_) {
|
||||
ofs << "%" << param->id_ << "P"
|
||||
<< "\t"
|
||||
<< "#" << param->size_ << "S"
|
||||
<< "\t"
|
||||
<< "&" << param->addr_ << "\t" << param->source_node_->fullname_with_scope() << "\t" << param->output_index_
|
||||
<< "\n";
|
||||
}
|
||||
|
||||
ofs << "\n\nAll Tensors:\n\n";
|
||||
ofs << "index:"
|
||||
<< "\tsize:"
|
||||
<< "\treal_size:"
|
||||
<< "\toffset:"
|
||||
<< "\taddr:"
|
||||
<< "\ttype:"
|
||||
<< "\tlifelong:\n";
|
||||
<< "\tlifelong:"
|
||||
<< "\tlife_start:"
|
||||
<< "\tlife_end:"
|
||||
<< "\tsource node name:\n";
|
||||
|
||||
for (const auto &tensor : tensors_list_) {
|
||||
auto scope_name = tensor->GetSourceNode()->scope_full_name_;
|
||||
std::string split_name = GetSplitName(scope_name);
|
||||
ofs << "%" << tensor->GetId() << "T"
|
||||
<< "\t"
|
||||
<< "#" << tensor->GetAlignedSize() << "S"
|
||||
|
@ -970,7 +1070,8 @@ void Somas::DumpSomasBasicIR(const string filename) {
|
|||
<< "&" << tensor->GetOffset() << ""
|
||||
<< "\t"
|
||||
<< "&" << static_cast<void *>(tensor->GetOffset() + mem_base_addr_) << "\t"
|
||||
<< tensor_type_name_map[tensor->type_] << "\t" << tensor->IsLifelong() << "\n";
|
||||
<< tensor_type_name_map[tensor->type_] << "\t" << tensor->IsLifelong() << "\t" << tensor->lifetime_.start_
|
||||
<< "\t" << tensor->lifetime_.end_ << "\t" << split_name << "\n";
|
||||
}
|
||||
|
||||
ofs << "\n\nAll Nodes:\n\n";
|
||||
|
@ -978,10 +1079,25 @@ void Somas::DumpSomasBasicIR(const string filename) {
|
|||
auto scope_name = node->scope_full_name_;
|
||||
std::string split_name = GetSplitName(scope_name);
|
||||
ofs << "$" << node->GetId() << "\t" << split_name << "\t" << static_cast<int>(node->GetType()) << "\t";
|
||||
vector<std::pair<string, size_t>> input_list;
|
||||
std::transform(
|
||||
node->input_tensors_.begin(), node->input_tensors_.end(), std::back_inserter(input_list),
|
||||
[](SomasTensorPtr in) -> std::pair<string, size_t> { return std::make_pair("Tensor", in->GetId()); });
|
||||
for (const auto ¶m : node->input_parameters_map_) {
|
||||
auto index = param.first;
|
||||
auto iter = input_list.begin();
|
||||
std::advance(iter, index);
|
||||
input_list.insert(iter, std::make_pair("Parameter", param.second->id_));
|
||||
}
|
||||
ofs << "inputs[";
|
||||
for (const auto &in : node->input_tensors_) {
|
||||
ofs << "%" << in->GetId() << "T"
|
||||
for (const auto &in : input_list) {
|
||||
if (in.first == "Tensor") {
|
||||
ofs << "%" << in.second << "T"
|
||||
<< ", ";
|
||||
} else if (in.first == "Parameter") {
|
||||
ofs << "%" << in.second << "P"
|
||||
<< ", ";
|
||||
}
|
||||
}
|
||||
ofs << "]";
|
||||
ofs << "\toutputs[";
|
||||
|
@ -1008,6 +1124,7 @@ void Somas::DumpSomasBasicIR(const string filename) {
|
|||
ofs << "\n";
|
||||
}
|
||||
|
||||
if (!ref_node_constraints_.empty()) {
|
||||
ofs << "\n\nAll Ref Node Info:\n\n";
|
||||
for (const auto &ref_in_out : ref_node_constraints_) {
|
||||
ofs << "refnode input-output:";
|
||||
|
@ -1017,6 +1134,7 @@ void Somas::DumpSomasBasicIR(const string filename) {
|
|||
ofs << "\n";
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
void Somas::DumpOfflineIR(const string filename) {
|
||||
MS_LOG(INFO) << "Printing somas-log-from-graph log: " << filename;
|
||||
|
@ -1197,115 +1315,7 @@ size_t Somas::CalcLowerBound() const {
|
|||
return max_lifetime;
|
||||
}
|
||||
|
||||
void Somas::DumpSomasMemoryPoolInfoIR(const string filename) {
|
||||
if (filename.size() > PATH_MAX) {
|
||||
MS_LOG(ERROR) << "File path " << filename << " is too long.";
|
||||
return;
|
||||
}
|
||||
|
||||
auto real_path = Common::GetRealPath(filename);
|
||||
if (!real_path.has_value()) {
|
||||
MS_LOG(ERROR) << "Get real path failed. path=" << filename;
|
||||
return;
|
||||
}
|
||||
|
||||
ChangeFileMode(real_path.value(), S_IRWXU);
|
||||
std::ofstream ofs(real_path.value());
|
||||
|
||||
if (!ofs.is_open()) {
|
||||
MS_LOG(ERROR) << "Open dump file '" << real_path.value() << "' failed!";
|
||||
return;
|
||||
}
|
||||
|
||||
ofs << "Total Dynamic Size (Upper Bound):\t" << upper_bound_ << "\n"
|
||||
<< "Theoretical Optimal Size (Lower Bound):\t" << lower_bound_ << "\n"
|
||||
<< "Total Workspace Size:\t" << workspace_total_size_ << "\n"
|
||||
<< "Total Communication Input Tensor Size:\t" << comm_input_total_size_ << "\n"
|
||||
<< "Total Communication Output Tensor Size:\t" << comm_output_total_size_ << "\n"
|
||||
<< "Total LifeLong All Tensor Size:\t" << lifelong_all_total_size_ << "\n"
|
||||
<< "Total LifeLong Start Tensor Size:\t" << lifelong_start_total_size_ << "\n"
|
||||
<< "Total LifeLong End Tensor Size:\t" << lifelong_end_total_size_ << "\n"
|
||||
<< "Reused Size(Allocate Size):\t" << GetTotalMemSize() << "\n\n\n";
|
||||
|
||||
std::map<size_t, size_t> mem_map;
|
||||
for (auto tensor : tensors_list_) {
|
||||
mem_map[tensor->GetOffset()] = 0;
|
||||
}
|
||||
|
||||
size_t num = 0;
|
||||
for (auto iter = mem_map.begin(); iter != mem_map.end(); ++iter, ++num) {
|
||||
iter->second = num;
|
||||
}
|
||||
|
||||
std::map<size_t, bool> tensor_mask;
|
||||
for (size_t i = 0; i < tensors_list_.size(); ++i) {
|
||||
tensor_mask[i] = false;
|
||||
}
|
||||
|
||||
std::vector<SomasTensorPtr> order_tensors_list = tensors_list_;
|
||||
std::sort(order_tensors_list.begin(), order_tensors_list.end(),
|
||||
[](const SomasTensorPtr tensor1, const SomasTensorPtr tensor2) {
|
||||
return tensor1->GetOffset() < tensor2->GetOffset();
|
||||
});
|
||||
|
||||
size_t cur_total_tensor_size = 0;
|
||||
for (const auto &node : nodes_list_) {
|
||||
if (node == nullptr) {
|
||||
MS_LOG(WARNING) << "Node is NULL, No ir information output";
|
||||
continue;
|
||||
}
|
||||
ofs << "node_name: " << GetSplitName(node->scope_full_name_) << "\tnode_id: " << node->GetId() << "\n";
|
||||
ofs << "mem_id\t"
|
||||
<< "mem_head\t"
|
||||
<< "mem_tail\t"
|
||||
<< "node_id\t"
|
||||
<< "stream_id\t"
|
||||
<< "tensor_id\t"
|
||||
<< "tensor_type\t"
|
||||
<< "lifelong\t"
|
||||
<< "origin_size\t"
|
||||
<< "align_size\t"
|
||||
<< "source_node\t"
|
||||
<< "lifetime_start\t"
|
||||
<< "lifetime_end\t\n";
|
||||
|
||||
size_t cur_alive_tensor_size = 0;
|
||||
size_t curr_runtime = node->GetId();
|
||||
for (size_t i = 0; i < order_tensors_list.size(); ++i) {
|
||||
auto tensor = order_tensors_list[i];
|
||||
if (tensor->lifetime_.start_ <= curr_runtime && tensor->lifetime_.end_ >= curr_runtime) {
|
||||
cur_alive_tensor_size += tensor->aligned_size_;
|
||||
if (!tensor_mask[i]) {
|
||||
cur_total_tensor_size += tensor->aligned_size_;
|
||||
tensor_mask[i] = true;
|
||||
}
|
||||
std::string scope_name;
|
||||
size_t src_node_id = 0xffff;
|
||||
size_t tensor_stream_id = 0xffff;
|
||||
if (tensor->GetSourceNode() != nullptr) {
|
||||
scope_name = tensor->GetSourceNode()->scope_full_name_;
|
||||
src_node_id = tensor->GetSourceNode()->GetId();
|
||||
tensor_stream_id = tensor->GetSourceNode()->GetId();
|
||||
} else {
|
||||
scope_name = "Somas Tensor";
|
||||
}
|
||||
std::string split_name = GetSplitName(scope_name);
|
||||
|
||||
ofs << "&" << mem_map[tensor->GetOffset()] << "\t" << tensor->GetOffset() << "\t"
|
||||
<< tensor->GetOffset() + tensor->GetAlignedSize() << "\t"
|
||||
<< "\t#" << src_node_id << "\t@" << tensor_stream_id << "\t%" << tensor->GetId() << "T\t"
|
||||
<< tensor_type_name_map[tensor->type_] << "\t" << static_cast<int>(tensor->lifelong_value_) << "\t"
|
||||
<< tensor->GetOriginalSize() << "\t" << tensor->GetAlignedSize() << "\t"
|
||||
<< "\t" << split_name << "\t" << tensor->lifetime_.start_ << "\t" << tensor->lifetime_.end_ << "\n";
|
||||
}
|
||||
}
|
||||
ofs << "Current Alive Tensor Size(Lower Bound):\t" << cur_alive_tensor_size << "\n"
|
||||
<< "Current Total Tensor Size(Upper Bound):\t" << cur_total_tensor_size << "\n\n";
|
||||
}
|
||||
ofs.close();
|
||||
}
|
||||
|
||||
void Somas::GenStatisticInfo() {
|
||||
void Somas::GenGraphStatisticInfo() {
|
||||
lower_bound_ = CalcLowerBound();
|
||||
for (const auto &tensor : tensors_list_) {
|
||||
upper_bound_ += tensor->aligned_size_;
|
||||
|
|
|
@ -29,6 +29,7 @@
|
|||
#include "backend/optimizer/somas/somas_node.h"
|
||||
#include "backend/optimizer/somas/somas_solver_pre.h"
|
||||
#include "backend/optimizer/somas/somas_stream.h"
|
||||
#include "backend/optimizer/somas/somas_parameter.h"
|
||||
#include "backend/session/anf_runtime_algorithm.h"
|
||||
#include "backend/session/kernel_graph.h"
|
||||
|
||||
|
@ -48,7 +49,7 @@ class Somas {
|
|||
uint8_t *GetNodeOutputPtr(const AnfNodePtr &node, size_t index) const;
|
||||
uint8_t *GetNodeWorkSpacePtr(const AnfNodePtr &node, size_t index) const;
|
||||
|
||||
void DumpSomasBasicIR(const string filename);
|
||||
void DumpSomasInfoIR(const string filename);
|
||||
void DumpSomasMemoryIR(const string filename);
|
||||
|
||||
static bool NodeSort(SomasNodePtr, SomasNodePtr);
|
||||
|
@ -58,11 +59,13 @@ class Somas {
|
|||
// Maps
|
||||
std::unordered_map<size_t, SomasTensorPtr> tensors_map_;
|
||||
std::map<void *, SomasNodePtr> nodes_map_;
|
||||
std::map<void *, vector<SomasParameterPtr>> parameters_map_;
|
||||
|
||||
// Vectors
|
||||
std::vector<SomasNodePtr> nodes_list_;
|
||||
std::vector<SomasStreamPtr> streams_list_;
|
||||
std::vector<SomasTensorPtr> tensors_list_;
|
||||
std::vector<SomasParameterPtr> parameters_list_;
|
||||
|
||||
// Stream groups
|
||||
std::vector<vector<uint32_t>> streams_groups_;
|
||||
|
@ -120,7 +123,11 @@ class Somas {
|
|||
void DumpSomasMemoryPoolInfoIR(const string filename);
|
||||
std::string GetSplitName(const string &scope_name) const;
|
||||
size_t CalcLowerBound() const;
|
||||
void GenStatisticInfo();
|
||||
void GenGraphStatisticInfo();
|
||||
SomasParameterPtr GetSomasParameters(AnfNodePtr node, size_t index);
|
||||
SomasParameterPtr CreateSomasParameters(AnfNodePtr node, size_t index);
|
||||
void InitCommonNodeInputs(bool is_all_nop_node, const CNodePtr &kernel);
|
||||
void InitAtomicCleanInputs(bool is_all_nop_node, const CNodePtr &kernel);
|
||||
};
|
||||
|
||||
using SomasPtr = std::shared_ptr<Somas>;
|
||||
|
|
|
@ -19,8 +19,10 @@
|
|||
|
||||
#include "backend/optimizer/somas/somas_stream.h"
|
||||
#include "backend/optimizer/somas/somas_tensor.h"
|
||||
#include "backend/optimizer/somas/somas_parameter.h"
|
||||
|
||||
#include <memory>
|
||||
#include <map>
|
||||
#include <set>
|
||||
#include <string>
|
||||
#include <unordered_map>
|
||||
|
@ -49,6 +51,7 @@ class SomasNode {
|
|||
std::vector<SomasTensorPtr> input_tensors_;
|
||||
std::vector<SomasTensorPtr> output_tensors_;
|
||||
std::vector<SomasTensorPtr> workspace_tensors_;
|
||||
std::map<size_t, SomasParameterPtr> input_parameters_map_;
|
||||
|
||||
std::unordered_map<int64_t, size_t> anc_stream_max_order_;
|
||||
|
||||
|
|
|
@ -0,0 +1,41 @@
|
|||
/**
|
||||
* Copyright 2021 Huawei Technologies Co., Ltd
|
||||
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef MINDSPORE_CCSRC_BACKEND_OPTIMIZER_SOMAS_SOMAS_PARAMETER_H_
|
||||
#define MINDSPORE_CCSRC_BACKEND_OPTIMIZER_SOMAS_SOMAS_PARAMETER_H_
|
||||
|
||||
#include <memory>
|
||||
#include "base/base.h"
|
||||
|
||||
namespace mindspore {
|
||||
namespace somas {
|
||||
class SomasParameter {
|
||||
public:
|
||||
SomasParameter(size_t id, AnfNodePtr source_node, size_t index, const void *addr, size_t size)
|
||||
: id_(id), source_node_(source_node), output_index_(index), addr_(const_cast<void *>(addr)), size_(size) {}
|
||||
~SomasParameter() = default;
|
||||
|
||||
const size_t id_{0};
|
||||
AnfNodePtr source_node_;
|
||||
size_t output_index_;
|
||||
void *addr_;
|
||||
size_t size_;
|
||||
};
|
||||
using SomasParameterPtr = std::shared_ptr<SomasParameter>;
|
||||
} // namespace somas
|
||||
} // namespace mindspore
|
||||
|
||||
#endif // MINDSPORE_CCSRC_BACKEND_OPTIMIZER_SOMAS_SOMAS_PARAMETER_H_
|
|
@ -73,9 +73,8 @@ void MemoryManager::MallocSomasDynamicMem(const session::KernelGraph *graph) {
|
|||
save_graphs_path = ".";
|
||||
}
|
||||
if (save_graphs) {
|
||||
std::string file_path =
|
||||
save_graphs_path + "/" + "somas_after_allocate_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
somas_reuse_util_ptr_->DumpSomasBasicIR(file_path);
|
||||
std::string file_path = save_graphs_path + "/" + "somas_allocate_info_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
somas_reuse_util_ptr_->DumpSomasInfoIR(file_path);
|
||||
|
||||
std::string mem_file_path = save_graphs_path + "/" + "somas_mem_info_" + std::to_string(graph->graph_id()) + ".ir";
|
||||
somas_reuse_util_ptr_->DumpSomasMemoryIR(mem_file_path);
|
||||
|
|
Loading…
Reference in New Issue