forked from mindspore-Ecosystem/mindspore
!23207 Adding security isolation to debugger
Merge pull request !23207 from sabrinasun_59ee/macro
This commit is contained in:
commit
dc45c64a78
|
@ -55,11 +55,13 @@ install(
|
||||||
COMPONENT mindspore
|
COMPONENT mindspore
|
||||||
)
|
)
|
||||||
|
|
||||||
install(
|
if(ENABLE_DEBUGGER)
|
||||||
|
install(
|
||||||
TARGETS _mindspore_offline_debug
|
TARGETS _mindspore_offline_debug
|
||||||
DESTINATION ${INSTALL_BASE_DIR}
|
DESTINATION ${INSTALL_BASE_DIR}
|
||||||
COMPONENT mindspore
|
COMPONENT mindspore
|
||||||
)
|
)
|
||||||
|
endif()
|
||||||
|
|
||||||
install(
|
install(
|
||||||
TARGETS mindspore_shared_lib
|
TARGETS mindspore_shared_lib
|
||||||
|
|
|
@ -56,15 +56,15 @@
|
||||||
#include "runtime/device/kernel_runtime_manager.h"
|
#include "runtime/device/kernel_runtime_manager.h"
|
||||||
#include "utils/config_manager.h"
|
#include "utils/config_manager.h"
|
||||||
#include "debug/data_dump/dump_json_parser.h"
|
#include "debug/data_dump/dump_json_parser.h"
|
||||||
#include "debug/tensor_load.h"
|
#include "debug/data_dump/e2e_dump.h"
|
||||||
#include "debug/anf_ir_utils.h"
|
#include "debug/anf_ir_utils.h"
|
||||||
#include "backend/optimizer/graph_kernel/graph_kernel_optimization.h"
|
#include "backend/optimizer/graph_kernel/graph_kernel_optimization.h"
|
||||||
#include "backend/session/ascend_auto_monad.h"
|
#include "backend/session/ascend_auto_monad.h"
|
||||||
#include "debug/data_dump/e2e_dump.h"
|
|
||||||
#include "debug/anf_ir_dump.h"
|
#include "debug/anf_ir_dump.h"
|
||||||
#include "debug/dump_proto.h"
|
#include "debug/dump_proto.h"
|
||||||
#include "abstract/utils.h"
|
#include "abstract/utils.h"
|
||||||
#ifdef ENABLE_DEBUGGER
|
#ifdef ENABLE_DEBUGGER
|
||||||
|
#include "debug/tensor_load.h"
|
||||||
#include "debug/debugger/proto_exporter.h"
|
#include "debug/debugger/proto_exporter.h"
|
||||||
#else
|
#else
|
||||||
#include "debug/debugger/proto_exporter_stub.h"
|
#include "debug/debugger/proto_exporter_stub.h"
|
||||||
|
@ -520,10 +520,12 @@ GraphId AscendSession::CompileGraphImpl(NotNull<FuncGraphPtr> func_graph) {
|
||||||
|
|
||||||
HardwareOptimize(NOT_NULL(root_graph), NOT_NULL(&memo));
|
HardwareOptimize(NOT_NULL(root_graph), NOT_NULL(&memo));
|
||||||
memo.clear();
|
memo.clear();
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
// load graphs to debugger.
|
// load graphs to debugger.
|
||||||
if (debugger_ && debugger_->DebuggerBackendEnabled()) {
|
if (debugger_ && debugger_->DebuggerBackendEnabled()) {
|
||||||
LoadGraphsToDbg(NOT_NULL(root_graph), NOT_NULL(&memo));
|
LoadGraphsToDbg(NOT_NULL(root_graph), NOT_NULL(&memo));
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
memo.clear();
|
memo.clear();
|
||||||
UpdateRefOutputMap(NOT_NULL(root_graph), NOT_NULL(&memo));
|
UpdateRefOutputMap(NOT_NULL(root_graph), NOT_NULL(&memo));
|
||||||
memo.clear();
|
memo.clear();
|
||||||
|
@ -553,9 +555,11 @@ GraphId AscendSession::CompileGraphImpl(NotNull<FuncGraphPtr> func_graph) {
|
||||||
device::KernelAdjust::GetInstance().InsertOverflowCheckOperations(NOT_NULL(root_graph));
|
device::KernelAdjust::GetInstance().InsertOverflowCheckOperations(NOT_NULL(root_graph));
|
||||||
// build kernel
|
// build kernel
|
||||||
BuildKernel(root_graph);
|
BuildKernel(root_graph);
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
if (debugger_ && debugger_->partial_memory()) {
|
if (debugger_ && debugger_->partial_memory()) {
|
||||||
debugger_->PreExecute(root_graph);
|
debugger_->PreExecute(root_graph);
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
SetSummaryNodes(root_graph.get());
|
SetSummaryNodes(root_graph.get());
|
||||||
// Alloc memory for child graph's inputs
|
// Alloc memory for child graph's inputs
|
||||||
AssignStaticMemory(NOT_NULL(root_graph), NOT_NULL(&memo));
|
AssignStaticMemory(NOT_NULL(root_graph), NOT_NULL(&memo));
|
||||||
|
@ -568,6 +572,7 @@ GraphId AscendSession::CompileGraphImpl(NotNull<FuncGraphPtr> func_graph) {
|
||||||
root_graph->SetOptimizerFlag();
|
root_graph->SetOptimizerFlag();
|
||||||
DumpAllGraphs(all_graphs);
|
DumpAllGraphs(all_graphs);
|
||||||
// Save memory profiling data to proto file
|
// Save memory profiling data to proto file
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
auto profiling_instance = MemoryProfiling::GetInstance();
|
auto profiling_instance = MemoryProfiling::GetInstance();
|
||||||
if (profiling_instance.IsMemoryProfilingEnable()) {
|
if (profiling_instance.IsMemoryProfilingEnable()) {
|
||||||
auto runtime_instance = device::KernelRuntimeManager::Instance().GetKernelRuntime(kAscendDevice, device_id_);
|
auto runtime_instance = device::KernelRuntimeManager::Instance().GetKernelRuntime(kAscendDevice, device_id_);
|
||||||
|
@ -576,6 +581,7 @@ GraphId AscendSession::CompileGraphImpl(NotNull<FuncGraphPtr> func_graph) {
|
||||||
profiling_instance.SetDeviceMemSize(mem_size);
|
profiling_instance.SetDeviceMemSize(mem_size);
|
||||||
profiling_instance.SaveMemoryProfiling();
|
profiling_instance.SaveMemoryProfiling();
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
// return the root_graph id to backend
|
// return the root_graph id to backend
|
||||||
auto graph_id = root_graph->graph_id();
|
auto graph_id = root_graph->graph_id();
|
||||||
return graph_id;
|
return graph_id;
|
||||||
|
@ -628,9 +634,11 @@ void AscendSession::BuildGraphImpl(GraphId graph_id) {
|
||||||
BuildKernel(graph);
|
BuildKernel(graph);
|
||||||
auto ms_context = MsContext::GetInstance();
|
auto ms_context = MsContext::GetInstance();
|
||||||
MS_EXCEPTION_IF_NULL(ms_context);
|
MS_EXCEPTION_IF_NULL(ms_context);
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
if (debugger_ && debugger_->partial_memory()) {
|
if (debugger_ && debugger_->partial_memory()) {
|
||||||
debugger_->PreExecute(graph);
|
debugger_->PreExecute(graph);
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
if (ms_context->get_param<bool>(MS_CTX_PRECOMPILE_ONLY)) {
|
if (ms_context->get_param<bool>(MS_CTX_PRECOMPILE_ONLY)) {
|
||||||
MS_LOG(INFO) << "Precompile only, stop in build kernel step";
|
MS_LOG(INFO) << "Precompile only, stop in build kernel step";
|
||||||
} else {
|
} else {
|
||||||
|
@ -677,9 +685,11 @@ bool AscendSession::IsSupportSummary() { return !device::KernelAdjust::NeedInser
|
||||||
|
|
||||||
void AscendSession::PreExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_graph,
|
void AscendSession::PreExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_graph,
|
||||||
const std::vector<tensor::TensorPtr> &inputs, VectorRef *const) {
|
const std::vector<tensor::TensorPtr> &inputs, VectorRef *const) {
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
if (debugger_) {
|
if (debugger_) {
|
||||||
debugger_->PreExecute(kernel_graph);
|
debugger_->PreExecute(kernel_graph);
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
#if ENABLE_CPU && ENABLE_D
|
#if ENABLE_CPU && ENABLE_D
|
||||||
// Initialize parameter server
|
// Initialize parameter server
|
||||||
InitPSParamAndOptim(kernel_graph, inputs);
|
InitPSParamAndOptim(kernel_graph, inputs);
|
||||||
|
@ -694,6 +704,7 @@ void AscendSession::PostExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_
|
||||||
const std::vector<tensor::TensorPtr> &, VectorRef *const) {
|
const std::vector<tensor::TensorPtr> &, VectorRef *const) {
|
||||||
// summary
|
// summary
|
||||||
Summary(kernel_graph.get());
|
Summary(kernel_graph.get());
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
// load tensor from device for debugger
|
// load tensor from device for debugger
|
||||||
if (debugger_ && debugger_->debugger_enabled()) {
|
if (debugger_ && debugger_->debugger_enabled()) {
|
||||||
LoadTensor(kernel_graph);
|
LoadTensor(kernel_graph);
|
||||||
|
@ -702,6 +713,7 @@ void AscendSession::PostExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_
|
||||||
if (debugger_) {
|
if (debugger_) {
|
||||||
debugger_->PostExecute();
|
debugger_->PostExecute();
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
void AscendSession::ExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_graph) { Execute(kernel_graph, true); }
|
void AscendSession::ExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_graph) { Execute(kernel_graph, true); }
|
||||||
|
@ -1759,6 +1771,7 @@ void AscendSession::HardwareOptimize(NotNull<KernelGraphPtr> graph,
|
||||||
MS_LOG(INFO) << "Finish doing HardwareOptimize in graph: " << graph->graph_id();
|
MS_LOG(INFO) << "Finish doing HardwareOptimize in graph: " << graph->graph_id();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
void AscendSession::LoadGraphsToDbg(NotNull<KernelGraphPtr> graph,
|
void AscendSession::LoadGraphsToDbg(NotNull<KernelGraphPtr> graph,
|
||||||
NotNull<std::set<KernelGraphPtr> *> const memo) const {
|
NotNull<std::set<KernelGraphPtr> *> const memo) const {
|
||||||
if (memo->find(graph) != memo->end()) {
|
if (memo->find(graph) != memo->end()) {
|
||||||
|
@ -1775,6 +1788,7 @@ void AscendSession::LoadGraphsToDbg(NotNull<KernelGraphPtr> graph,
|
||||||
}
|
}
|
||||||
MS_LOG(INFO) << "Finish doing LoadGraphsToDbg in graph: " << graph->graph_id();
|
MS_LOG(INFO) << "Finish doing LoadGraphsToDbg in graph: " << graph->graph_id();
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
void AscendSession::AssignStaticMemory(NotNull<KernelGraphPtr> graph,
|
void AscendSession::AssignStaticMemory(NotNull<KernelGraphPtr> graph,
|
||||||
NotNull<std::set<KernelGraphPtr> *> const memo) const {
|
NotNull<std::set<KernelGraphPtr> *> const memo) const {
|
||||||
|
|
|
@ -133,7 +133,9 @@ class AscendSession : public SessionBasic {
|
||||||
size_t *const raise_precision_count, size_t *const reduce_precision_count) const;
|
size_t *const raise_precision_count, size_t *const reduce_precision_count) const;
|
||||||
void IrFusionPass(const NotNull<KernelGraphPtr> graph, NotNull<std::set<KernelGraphPtr> *> memo);
|
void IrFusionPass(const NotNull<KernelGraphPtr> graph, NotNull<std::set<KernelGraphPtr> *> memo);
|
||||||
void HardwareOptimize(const NotNull<KernelGraphPtr> graph, NotNull<std::set<KernelGraphPtr> *> memo) const;
|
void HardwareOptimize(const NotNull<KernelGraphPtr> graph, NotNull<std::set<KernelGraphPtr> *> memo) const;
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
void LoadGraphsToDbg(const NotNull<KernelGraphPtr> graph, NotNull<std::set<KernelGraphPtr> *> memo) const;
|
void LoadGraphsToDbg(const NotNull<KernelGraphPtr> graph, NotNull<std::set<KernelGraphPtr> *> memo) const;
|
||||||
|
#endif
|
||||||
void AssignStaticMemory(const NotNull<KernelGraphPtr> graph, NotNull<std::set<KernelGraphPtr> *> memo) const;
|
void AssignStaticMemory(const NotNull<KernelGraphPtr> graph, NotNull<std::set<KernelGraphPtr> *> memo) const;
|
||||||
void UpdateRefOutputMap(const NotNull<KernelGraphPtr> graph, NotNull<std::set<KernelGraphPtr> *> memo) const;
|
void UpdateRefOutputMap(const NotNull<KernelGraphPtr> graph, NotNull<std::set<KernelGraphPtr> *> memo) const;
|
||||||
void CacheCNodeOutputInfo(const KernelGraph &graph) const;
|
void CacheCNodeOutputInfo(const KernelGraph &graph) const;
|
||||||
|
|
|
@ -57,16 +57,16 @@
|
||||||
#include "backend/optimizer/pass/optimize_updatestate.h"
|
#include "backend/optimizer/pass/optimize_updatestate.h"
|
||||||
#include "common/trans.h"
|
#include "common/trans.h"
|
||||||
#include "debug/anf_ir_dump.h"
|
#include "debug/anf_ir_dump.h"
|
||||||
#include "debug/data_dump/e2e_dump.h"
|
#include "debug/dump_proto.h"
|
||||||
#ifdef ENABLE_DEBUGGER
|
#ifdef ENABLE_DEBUGGER
|
||||||
|
#include "debug/data_dump/e2e_dump.h"
|
||||||
|
#include "debug/data_dump/dump_json_parser.h"
|
||||||
#include "debug/debugger/proto_exporter.h"
|
#include "debug/debugger/proto_exporter.h"
|
||||||
|
#include "debug/data_dump/dump_utils.h"
|
||||||
|
#include "debug/tensor_load.h"
|
||||||
#else
|
#else
|
||||||
#include "debug/debugger/proto_exporter_stub.h"
|
#include "debug/debugger/proto_exporter_stub.h"
|
||||||
#endif
|
#endif
|
||||||
#include "debug/data_dump/dump_json_parser.h"
|
|
||||||
#include "debug/data_dump/dump_utils.h"
|
|
||||||
#include "debug/tensor_load.h"
|
|
||||||
#include "debug/dump_proto.h"
|
|
||||||
#include "runtime/device/gpu/gpu_kernel_build.h"
|
#include "runtime/device/gpu/gpu_kernel_build.h"
|
||||||
#include "runtime/device/gpu/gpu_kernel_runtime.h"
|
#include "runtime/device/gpu/gpu_kernel_runtime.h"
|
||||||
#include "runtime/device/gpu/gpu_stream_assign.h"
|
#include "runtime/device/gpu/gpu_stream_assign.h"
|
||||||
|
@ -123,11 +123,12 @@ void GPUSession::Init(uint32_t device_id) {
|
||||||
rank_id_ = GetRankId();
|
rank_id_ = GetRankId();
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
auto &json_parser = DumpJsonParser::GetInstance();
|
auto &json_parser = DumpJsonParser::GetInstance();
|
||||||
// Dump json config file if dump is enabled
|
// Dump json config file if dump is enabled
|
||||||
json_parser.CopyJsonToDir(rank_id_);
|
json_parser.CopyJsonToDir(rank_id_);
|
||||||
json_parser.CopyMSCfgJsonToDir(rank_id_);
|
json_parser.CopyMSCfgJsonToDir(rank_id_);
|
||||||
|
#endif
|
||||||
MS_LOG(INFO) << "Set device id " << device_id << " for gpu session.";
|
MS_LOG(INFO) << "Set device id " << device_id << " for gpu session.";
|
||||||
InitExecutor(kGPUDevice, device_id);
|
InitExecutor(kGPUDevice, device_id);
|
||||||
}
|
}
|
||||||
|
@ -403,8 +404,10 @@ GraphId GPUSession::CompileGraphImpl(KernelGraphPtr graph) {
|
||||||
bool save_graphs = context_ptr->get_param<bool>(MS_CTX_SAVE_GRAPHS_FLAG);
|
bool save_graphs = context_ptr->get_param<bool>(MS_CTX_SAVE_GRAPHS_FLAG);
|
||||||
auto runtime_instance = device::KernelRuntimeManager::Instance().GetSingleKernelRuntime(kGPUDevice, device_id_);
|
auto runtime_instance = device::KernelRuntimeManager::Instance().GetSingleKernelRuntime(kGPUDevice, device_id_);
|
||||||
MS_EXCEPTION_IF_NULL(runtime_instance);
|
MS_EXCEPTION_IF_NULL(runtime_instance);
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
auto &json_parser = DumpJsonParser::GetInstance();
|
auto &json_parser = DumpJsonParser::GetInstance();
|
||||||
json_parser.Parse();
|
json_parser.Parse();
|
||||||
|
#endif
|
||||||
// Dump .pb graph before graph optimization
|
// Dump .pb graph before graph optimization
|
||||||
if (save_graphs) {
|
if (save_graphs) {
|
||||||
DumpIRProto(graph, "before_opt_" + std::to_string(graph->graph_id()));
|
DumpIRProto(graph, "before_opt_" + std::to_string(graph->graph_id()));
|
||||||
|
@ -454,6 +457,7 @@ GraphId GPUSession::CompileGraphImpl(KernelGraphPtr graph) {
|
||||||
if (save_graphs) {
|
if (save_graphs) {
|
||||||
DumpIRProto(graph, "after_opt_" + std::to_string(graph->graph_id()));
|
DumpIRProto(graph, "after_opt_" + std::to_string(graph->graph_id()));
|
||||||
}
|
}
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
if (json_parser.e2e_dump_enabled()) {
|
if (json_parser.e2e_dump_enabled()) {
|
||||||
graph->set_root_graph_id(graph->graph_id());
|
graph->set_root_graph_id(graph->graph_id());
|
||||||
std::string final_graph = "trace_code_graph_" + std::to_string(graph->graph_id());
|
std::string final_graph = "trace_code_graph_" + std::to_string(graph->graph_id());
|
||||||
|
@ -465,6 +469,7 @@ GraphId GPUSession::CompileGraphImpl(KernelGraphPtr graph) {
|
||||||
DumpGraphExeOrder("ms_execution_order_graph_" + std::to_string(graph->graph_id()) + ".csv", root_dir,
|
DumpGraphExeOrder("ms_execution_order_graph_" + std::to_string(graph->graph_id()) + ".csv", root_dir,
|
||||||
graph->execution_order());
|
graph->execution_order());
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
// Set graph manager.
|
// Set graph manager.
|
||||||
MS_EXCEPTION_IF_NULL(context_);
|
MS_EXCEPTION_IF_NULL(context_);
|
||||||
FuncGraphManagerPtr manager = MakeManager({graph});
|
FuncGraphManagerPtr manager = MakeManager({graph});
|
||||||
|
@ -493,11 +498,13 @@ GraphId GPUSession::CompileGraphImpl(KernelGraphPtr graph) {
|
||||||
|
|
||||||
void GPUSession::PreExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_graph,
|
void GPUSession::PreExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_graph,
|
||||||
const std::vector<tensor::TensorPtr> &inputs, VectorRef *outputs) {
|
const std::vector<tensor::TensorPtr> &inputs, VectorRef *outputs) {
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
if (debugger_) {
|
if (debugger_) {
|
||||||
debugger_->PreExecute(kernel_graph);
|
debugger_->PreExecute(kernel_graph);
|
||||||
}
|
}
|
||||||
|
|
||||||
DumpSetup(kernel_graph);
|
DumpSetup(kernel_graph);
|
||||||
|
#endif
|
||||||
|
|
||||||
#if ENABLE_CPU && ENABLE_GPU
|
#if ENABLE_CPU && ENABLE_GPU
|
||||||
// Initialize parameter server
|
// Initialize parameter server
|
||||||
|
@ -513,7 +520,7 @@ void GPUSession::PostExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_gra
|
||||||
if (context_ptr->get_param<bool>(MS_CTX_ENABLE_GPU_SUMMARY)) {
|
if (context_ptr->get_param<bool>(MS_CTX_ENABLE_GPU_SUMMARY)) {
|
||||||
Summary(kernel_graph.get());
|
Summary(kernel_graph.get());
|
||||||
}
|
}
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
if (debugger_ && debugger_->DebuggerBackendEnabled()) {
|
if (debugger_ && debugger_->DebuggerBackendEnabled()) {
|
||||||
debugger_->LoadParametersAndConst(kernel_graph);
|
debugger_->LoadParametersAndConst(kernel_graph);
|
||||||
}
|
}
|
||||||
|
@ -526,6 +533,7 @@ void GPUSession::PostExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_gra
|
||||||
if (debugger_) {
|
if (debugger_) {
|
||||||
debugger_->PostExecute();
|
debugger_->PostExecute();
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
void GPUSession::ExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_graph) {
|
void GPUSession::ExecuteGraph(const std::shared_ptr<KernelGraph> &kernel_graph) {
|
||||||
|
@ -683,6 +691,7 @@ void GPUSession::RunOpImpl(const GraphInfo &graph_info, OpRunInfo *op_run_info,
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
void GPUSession::DumpSetup(const std::shared_ptr<KernelGraph> &kernel_graph) const {
|
void GPUSession::DumpSetup(const std::shared_ptr<KernelGraph> &kernel_graph) const {
|
||||||
MS_LOG(INFO) << "Start!";
|
MS_LOG(INFO) << "Start!";
|
||||||
MS_EXCEPTION_IF_NULL(kernel_graph);
|
MS_EXCEPTION_IF_NULL(kernel_graph);
|
||||||
|
@ -704,6 +713,7 @@ bool GPUSession::DumpDataEnabledIteration() const {
|
||||||
MS_EXCEPTION_IF_NULL(runtime_instance);
|
MS_EXCEPTION_IF_NULL(runtime_instance);
|
||||||
return runtime_instance->DumpDataEnabledIteration();
|
return runtime_instance->DumpDataEnabledIteration();
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
void GPUSession::SyncStream() const {
|
void GPUSession::SyncStream() const {
|
||||||
auto runtime_instance = device::KernelRuntimeManager::Instance().GetSingleKernelRuntime(kGPUDevice, device_id_);
|
auto runtime_instance = device::KernelRuntimeManager::Instance().GetSingleKernelRuntime(kGPUDevice, device_id_);
|
||||||
|
|
|
@ -90,11 +90,13 @@ class GPUSession : public SessionBasic {
|
||||||
|
|
||||||
void Execute(const std::shared_ptr<KernelGraph> &kernel_graph) const;
|
void Execute(const std::shared_ptr<KernelGraph> &kernel_graph) const;
|
||||||
|
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
void Dump(const std::shared_ptr<KernelGraph> &kernel_graph) const;
|
void Dump(const std::shared_ptr<KernelGraph> &kernel_graph) const;
|
||||||
|
|
||||||
void DumpSetup(const std::shared_ptr<KernelGraph> &kernel_graph) const;
|
void DumpSetup(const std::shared_ptr<KernelGraph> &kernel_graph) const;
|
||||||
|
|
||||||
bool DumpDataEnabledIteration() const;
|
bool DumpDataEnabledIteration() const;
|
||||||
|
#endif
|
||||||
|
|
||||||
GraphId CompileGraphImpl(KernelGraphPtr kernel_graph);
|
GraphId CompileGraphImpl(KernelGraphPtr kernel_graph);
|
||||||
};
|
};
|
||||||
|
|
|
@ -33,7 +33,7 @@
|
||||||
#include "runtime/device/kernel_info.h"
|
#include "runtime/device/kernel_info.h"
|
||||||
#include "utils/ms_context.h"
|
#include "utils/ms_context.h"
|
||||||
#include "runtime/device/bucket.h"
|
#include "runtime/device/bucket.h"
|
||||||
#if !defined(_WIN32) && !defined(_WIN64)
|
#if defined(ENABLE_DEBUGGER) && !defined(_WIN32) && !defined(_WIN64)
|
||||||
#include "debug/debugger/debugger.h"
|
#include "debug/debugger/debugger.h"
|
||||||
#endif
|
#endif
|
||||||
#include "runtime/hardware/device_context.h"
|
#include "runtime/hardware/device_context.h"
|
||||||
|
@ -93,7 +93,7 @@ class Executor;
|
||||||
class SessionBasic : public std::enable_shared_from_this<SessionBasic> {
|
class SessionBasic : public std::enable_shared_from_this<SessionBasic> {
|
||||||
public:
|
public:
|
||||||
SessionBasic() : context_(nullptr), summary_callback_(nullptr), device_id_(0) {
|
SessionBasic() : context_(nullptr), summary_callback_(nullptr), device_id_(0) {
|
||||||
#if !defined(_WIN32) && !defined(_WIN64)
|
#if defined(ENABLE_DEBUGGER) && !defined(_WIN32) && !defined(_WIN64)
|
||||||
debugger_ = nullptr;
|
debugger_ = nullptr;
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
@ -319,7 +319,7 @@ class SessionBasic : public std::enable_shared_from_this<SessionBasic> {
|
||||||
// rank id of physical device
|
// rank id of physical device
|
||||||
uint32_t rank_id_{0};
|
uint32_t rank_id_{0};
|
||||||
std::shared_ptr<Executor> executor_;
|
std::shared_ptr<Executor> executor_;
|
||||||
#if !defined(_WIN32) && !defined(_WIN64)
|
#if defined(ENABLE_DEBUGGER) && !defined(_WIN32) && !defined(_WIN64)
|
||||||
std::shared_ptr<Debugger> debugger_;
|
std::shared_ptr<Debugger> debugger_;
|
||||||
#endif
|
#endif
|
||||||
};
|
};
|
||||||
|
|
|
@ -60,7 +60,8 @@ endif()
|
||||||
set_property(SOURCE ${_DEBUG_SRC_LIST} ${_RDR_SRC_LIST} PROPERTY COMPILE_DEFINITIONS
|
set_property(SOURCE ${_DEBUG_SRC_LIST} ${_RDR_SRC_LIST} PROPERTY COMPILE_DEFINITIONS
|
||||||
SUBMODULE_ID=mindspore::SubModuleId::SM_DEBUG)
|
SUBMODULE_ID=mindspore::SubModuleId::SM_DEBUG)
|
||||||
add_library(_mindspore_debug_obj OBJECT ${_DEBUG_SRC_LIST} ${_RDR_SRC_LIST})
|
add_library(_mindspore_debug_obj OBJECT ${_DEBUG_SRC_LIST} ${_RDR_SRC_LIST})
|
||||||
if(NOT CMAKE_SYSTEM_NAME MATCHES "Windows")
|
if(ENABLE_DEBUGGER)
|
||||||
|
if(NOT CMAKE_SYSTEM_NAME MATCHES "Windows")
|
||||||
add_compile_options(-Wall -DOFFLINE_DBG_MODE -fPIC -O2)
|
add_compile_options(-Wall -DOFFLINE_DBG_MODE -fPIC -O2)
|
||||||
set_property(SOURCE ${_OFFLINE_SRC_LIST} PROPERTY COMPILE_DEFINITIONS
|
set_property(SOURCE ${_OFFLINE_SRC_LIST} PROPERTY COMPILE_DEFINITIONS
|
||||||
SUBMODULE_ID=mindspore::SubModuleId::SM_OFFLINE_DEBUG)
|
SUBMODULE_ID=mindspore::SubModuleId::SM_OFFLINE_DEBUG)
|
||||||
|
@ -69,4 +70,5 @@ if(NOT CMAKE_SYSTEM_NAME MATCHES "Windows")
|
||||||
PREFIX "${PYTHON_MODULE_PREFIX}"
|
PREFIX "${PYTHON_MODULE_PREFIX}"
|
||||||
SUFFIX "${PYTHON_MODULE_EXTENSION}"
|
SUFFIX "${PYTHON_MODULE_EXTENSION}"
|
||||||
)
|
)
|
||||||
|
endif()
|
||||||
endif()
|
endif()
|
||||||
|
|
|
@ -103,7 +103,9 @@ const char IR_TYPE_MINDIR[] = "mind_ir";
|
||||||
|
|
||||||
GraphExecutorPyPtr GraphExecutorPy::executor_ = nullptr;
|
GraphExecutorPyPtr GraphExecutorPy::executor_ = nullptr;
|
||||||
std::mutex GraphExecutorPy::instance_lock_;
|
std::mutex GraphExecutorPy::instance_lock_;
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
bool GraphExecutorPy::debugger_terminate_ = false;
|
bool GraphExecutorPy::debugger_terminate_ = false;
|
||||||
|
#endif
|
||||||
|
|
||||||
std::unordered_map<abstract::AbstractBasePtrList, uint64_t, abstract::AbstractBasePtrListHasher,
|
std::unordered_map<abstract::AbstractBasePtrList, uint64_t, abstract::AbstractBasePtrListHasher,
|
||||||
abstract::AbstractBasePtrListEqual>
|
abstract::AbstractBasePtrListEqual>
|
||||||
|
@ -683,8 +685,10 @@ std::vector<ActionItem> GetPipeline(const ResourcePtr &resource, const std::stri
|
||||||
compile::SetMindRTEnable();
|
compile::SetMindRTEnable();
|
||||||
// Create backend.
|
// Create backend.
|
||||||
auto backend_ptr = compile::CreateBackend();
|
auto backend_ptr = compile::CreateBackend();
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
// Connect session to debugger
|
// Connect session to debugger
|
||||||
backend_ptr->SetDebugger();
|
backend_ptr->SetDebugger();
|
||||||
|
#endif
|
||||||
resource->results()[kBackend] = backend_ptr;
|
resource->results()[kBackend] = backend_ptr;
|
||||||
// If the 'use_frontend_compile_cache' context has been set true and the cache is read successfully,
|
// If the 'use_frontend_compile_cache' context has been set true and the cache is read successfully,
|
||||||
// do the backend actions only.
|
// do the backend actions only.
|
||||||
|
@ -990,6 +994,7 @@ void GraphExecutorPy::ProcessVmArg(const py::tuple &args, const std::string &pha
|
||||||
ProcessVmArgInner(args, GetResource(phase), arg_list);
|
ProcessVmArgInner(args, GetResource(phase), arg_list);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
void GraphExecutorPy::TerminateDebugger() {
|
void GraphExecutorPy::TerminateDebugger() {
|
||||||
if (debugger_terminate_) {
|
if (debugger_terminate_) {
|
||||||
MS_LOG(INFO) << "Terminate debugger and clear resources!";
|
MS_LOG(INFO) << "Terminate debugger and clear resources!";
|
||||||
|
@ -997,10 +1002,13 @@ void GraphExecutorPy::TerminateDebugger() {
|
||||||
exit(1);
|
exit(1);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
py::object GraphExecutorPy::Run(const py::tuple &args, const py::object &phase_obj) {
|
py::object GraphExecutorPy::Run(const py::tuple &args, const py::object &phase_obj) {
|
||||||
// Mindspore debugger notify main thread to exit after one step, and will not run next step
|
// Mindspore debugger notify main thread to exit after one step, and will not run next step
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
TerminateDebugger();
|
TerminateDebugger();
|
||||||
|
#endif
|
||||||
std::size_t size = args.size();
|
std::size_t size = args.size();
|
||||||
if (!py::isinstance<py::str>(phase_obj)) {
|
if (!py::isinstance<py::str>(phase_obj)) {
|
||||||
MS_LOG(EXCEPTION) << "Run failed, phase input is not a str";
|
MS_LOG(EXCEPTION) << "Run failed, phase input is not a str";
|
||||||
|
|
|
@ -107,9 +107,11 @@ class GraphExecutorPy : public std::enable_shared_from_this<GraphExecutorPy> {
|
||||||
void DelNetRes(const std::string &id);
|
void DelNetRes(const std::string &id);
|
||||||
void ReleaseResource(const py::object &phase_obj);
|
void ReleaseResource(const py::object &phase_obj);
|
||||||
static void ClearRes();
|
static void ClearRes();
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
static bool GetDebugTerminate() { return debugger_terminate_; }
|
static bool GetDebugTerminate() { return debugger_terminate_; }
|
||||||
static void DebugTerminate(bool val) { debugger_terminate_ = val; }
|
static void DebugTerminate(bool val) { debugger_terminate_ = val; }
|
||||||
void TerminateDebugger();
|
void TerminateDebugger();
|
||||||
|
#endif
|
||||||
|
|
||||||
std::map<std::string, std::pair<PrimitivePyAdapterPtr, std::string>> FetchInfoForQuantExport(
|
std::map<std::string, std::pair<PrimitivePyAdapterPtr, std::string>> FetchInfoForQuantExport(
|
||||||
const std::string &phase);
|
const std::string &phase);
|
||||||
|
@ -127,7 +129,9 @@ class GraphExecutorPy : public std::enable_shared_from_this<GraphExecutorPy> {
|
||||||
std::map<std::string, ExecutorInfoPtr> info_;
|
std::map<std::string, ExecutorInfoPtr> info_;
|
||||||
static std::shared_ptr<GraphExecutorPy> executor_;
|
static std::shared_ptr<GraphExecutorPy> executor_;
|
||||||
static std::mutex instance_lock_;
|
static std::mutex instance_lock_;
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
static bool debugger_terminate_;
|
static bool debugger_terminate_;
|
||||||
|
#endif
|
||||||
std::map<std::string, py::dict> stra_dict_;
|
std::map<std::string, py::dict> stra_dict_;
|
||||||
std::string phase_ = "";
|
std::string phase_ = "";
|
||||||
std::map<std::string, size_t> phase_to_num_op_info_;
|
std::map<std::string, size_t> phase_to_num_op_info_;
|
||||||
|
|
|
@ -358,8 +358,9 @@ bool AscendKernelRuntime::Init() {
|
||||||
if (!ret) {
|
if (!ret) {
|
||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
SetDebugger();
|
SetDebugger();
|
||||||
|
#endif
|
||||||
mem_manager_ = std::make_shared<AscendMemoryManager>();
|
mem_manager_ = std::make_shared<AscendMemoryManager>();
|
||||||
MS_EXCEPTION_IF_NULL(mem_manager_);
|
MS_EXCEPTION_IF_NULL(mem_manager_);
|
||||||
mem_manager_->MallocDeviceMemory();
|
mem_manager_->MallocDeviceMemory();
|
||||||
|
@ -583,7 +584,6 @@ void AscendKernelRuntime::DistributeDebugTask(NotNull<const session::KernelGraph
|
||||||
MS_LOG(WARNING) << "[DataDump] Insert graphId:" << graph->graph_id() << " data dumper failed";
|
MS_LOG(WARNING) << "[DataDump] Insert graphId:" << graph->graph_id() << " data dumper failed";
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
#endif
|
|
||||||
|
|
||||||
void AscendKernelRuntime::LaunchDataDump(GraphId graph_id) {
|
void AscendKernelRuntime::LaunchDataDump(GraphId graph_id) {
|
||||||
if (!DumpJsonParser::GetInstance().async_dump_enabled()) {
|
if (!DumpJsonParser::GetInstance().async_dump_enabled()) {
|
||||||
|
@ -600,6 +600,7 @@ void AscendKernelRuntime::LaunchDataDump(GraphId graph_id) {
|
||||||
MS_LOG(EXCEPTION) << "GraphId:" << graph_id << " not found";
|
MS_LOG(EXCEPTION) << "GraphId:" << graph_id << " not found";
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
void AscendKernelRuntime::TaskFailCallback(rtExceptionInfo *task_fail_info) {
|
void AscendKernelRuntime::TaskFailCallback(rtExceptionInfo *task_fail_info) {
|
||||||
MS_EXCEPTION_IF_NULL(task_fail_info);
|
MS_EXCEPTION_IF_NULL(task_fail_info);
|
||||||
|
|
|
@ -49,8 +49,10 @@ bool TaskGenerator::GenTasks(const std::vector<CNodePtr> &anf_node_list, std::ve
|
||||||
MS_EXCEPTION_IF_NULL(context_ptr);
|
MS_EXCEPTION_IF_NULL(context_ptr);
|
||||||
bool save_graphs = context_ptr->get_param<bool>(MS_CTX_SAVE_GRAPHS_FLAG);
|
bool save_graphs = context_ptr->get_param<bool>(MS_CTX_SAVE_GRAPHS_FLAG);
|
||||||
if (save_graphs) {
|
if (save_graphs) {
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
std::string file_path = GetSaveGraphsPathName("task_info_graph_" + std::to_string(graph_id) + ".ir");
|
std::string file_path = GetSaveGraphsPathName("task_info_graph_" + std::to_string(graph_id) + ".ir");
|
||||||
DumpTaskInfo(file_path);
|
DumpTaskInfo(file_path);
|
||||||
|
#endif
|
||||||
}
|
}
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
|
@ -127,6 +127,7 @@ void GPUDeviceAddress::ClearDeviceMemory() {
|
||||||
|
|
||||||
GPUDeviceAddress::~GPUDeviceAddress() { ClearDeviceMemory(); }
|
GPUDeviceAddress::~GPUDeviceAddress() { ClearDeviceMemory(); }
|
||||||
|
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
bool GPUDeviceAddress::LoadMemToHost(const std::string &tensor_name, int execution_order, const std::string &host_fmt,
|
bool GPUDeviceAddress::LoadMemToHost(const std::string &tensor_name, int execution_order, const std::string &host_fmt,
|
||||||
const ShapeVector &host_shape, TypeId host_type, size_t slot,
|
const ShapeVector &host_shape, TypeId host_type, size_t slot,
|
||||||
bool keep_prev) const {
|
bool keep_prev) const {
|
||||||
|
@ -161,6 +162,7 @@ bool GPUDeviceAddress::LoadMemToHost(const std::string &tensor_name, int executi
|
||||||
MS_LOG(INFO) << "E2E tensor name is " << tensor_name;
|
MS_LOG(INFO) << "E2E tensor name is " << tensor_name;
|
||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
} // namespace gpu
|
} // namespace gpu
|
||||||
} // namespace device
|
} // namespace device
|
||||||
} // namespace mindspore
|
} // namespace mindspore
|
||||||
|
|
|
@ -38,7 +38,9 @@
|
||||||
#include "profiler/device/gpu/gpu_profiling.h"
|
#include "profiler/device/gpu/gpu_profiling.h"
|
||||||
#include "profiler/device/gpu/gpu_profiling_utils.h"
|
#include "profiler/device/gpu/gpu_profiling_utils.h"
|
||||||
#include "utils/shape_utils.h"
|
#include "utils/shape_utils.h"
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
#include "debug/data_dump/dump_json_parser.h"
|
#include "debug/data_dump/dump_json_parser.h"
|
||||||
|
#endif
|
||||||
#include "backend/kernel_compiler/gpu/gpu_kernel.h"
|
#include "backend/kernel_compiler/gpu/gpu_kernel.h"
|
||||||
#ifdef ENABLE_DEBUGGER
|
#ifdef ENABLE_DEBUGGER
|
||||||
#include "debug/debug_services.h"
|
#include "debug/debug_services.h"
|
||||||
|
@ -85,7 +87,9 @@ bool GPUKernelRuntime::Init() {
|
||||||
MS_LOG(ERROR) << "InitDevice error.";
|
MS_LOG(ERROR) << "InitDevice error.";
|
||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
DumpJsonParser::GetInstance().Parse();
|
DumpJsonParser::GetInstance().Parse();
|
||||||
|
#endif
|
||||||
mem_manager_ = std::make_shared<GPUMemoryManager>();
|
mem_manager_ = std::make_shared<GPUMemoryManager>();
|
||||||
MS_EXCEPTION_IF_NULL(mem_manager_);
|
MS_EXCEPTION_IF_NULL(mem_manager_);
|
||||||
mem_manager_->MallocDeviceMemory();
|
mem_manager_->MallocDeviceMemory();
|
||||||
|
@ -98,7 +102,11 @@ bool GPUKernelRuntime::Init() {
|
||||||
(*init_nccl_comm_funcptr)();
|
(*init_nccl_comm_funcptr)();
|
||||||
}
|
}
|
||||||
device_init_ = true;
|
device_init_ = true;
|
||||||
|
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
SetDebugger();
|
SetDebugger();
|
||||||
|
#endif
|
||||||
|
|
||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -120,6 +128,7 @@ std::vector<int> CheckRealOutput(const std::string &node_name, const size_t &out
|
||||||
return real_outputs;
|
return real_outputs;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
void LoadKernelData(Debugger *debugger, const CNodePtr &kernel,
|
void LoadKernelData(Debugger *debugger, const CNodePtr &kernel,
|
||||||
const std::vector<mindspore::kernel::AddressPtr> &kernel_inputs,
|
const std::vector<mindspore::kernel::AddressPtr> &kernel_inputs,
|
||||||
const std::vector<mindspore::kernel::AddressPtr> &kernel_workspaces,
|
const std::vector<mindspore::kernel::AddressPtr> &kernel_workspaces,
|
||||||
|
@ -199,6 +208,7 @@ void LoadKernelData(Debugger *debugger, const CNodePtr &kernel,
|
||||||
}
|
}
|
||||||
debugger->PostExecuteNode(kernel, last_kernel);
|
debugger->PostExecuteNode(kernel, last_kernel);
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
} // namespace
|
} // namespace
|
||||||
|
|
||||||
bool GPUKernelRuntime::MemcpyAsync(void *dst, const void *src, uint64_t size, int32_t kind) {
|
bool GPUKernelRuntime::MemcpyAsync(void *dst, const void *src, uint64_t size, int32_t kind) {
|
||||||
|
@ -723,10 +733,12 @@ bool GPUKernelRuntime::LaunchKernelDynamic(const session::KernelGraph *graph, bo
|
||||||
AllocCommunicationOpDynamicRes(graph);
|
AllocCommunicationOpDynamicRes(graph);
|
||||||
AllocInplaceNodeMemory(graph);
|
AllocInplaceNodeMemory(graph);
|
||||||
|
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
bool dump_enabled = GPUKernelRuntime::DumpDataEnabledIteration();
|
bool dump_enabled = GPUKernelRuntime::DumpDataEnabledIteration();
|
||||||
if (!mock && debugger_) {
|
if (!mock && debugger_) {
|
||||||
debugger_->UpdateStepNum(graph);
|
debugger_->UpdateStepNum(graph);
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
auto &kernels = graph->execution_order();
|
auto &kernels = graph->execution_order();
|
||||||
int exec_order = 1;
|
int exec_order = 1;
|
||||||
#ifdef ENABLE_DUMP_IR
|
#ifdef ENABLE_DUMP_IR
|
||||||
|
@ -760,11 +772,13 @@ bool GPUKernelRuntime::LaunchKernelDynamic(const session::KernelGraph *graph, bo
|
||||||
AddressPtrList kernel_outputs;
|
AddressPtrList kernel_outputs;
|
||||||
auto ret = AllocKernelDynamicRes(*kernel_mod, kernel, &kernel_inputs, &kernel_workspaces, &kernel_outputs, mock);
|
auto ret = AllocKernelDynamicRes(*kernel_mod, kernel, &kernel_inputs, &kernel_workspaces, &kernel_outputs, mock);
|
||||||
if (!ret) {
|
if (!ret) {
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
if (!mock) {
|
if (!mock) {
|
||||||
MS_EXCEPTION_IF_NULL(debugger_);
|
MS_EXCEPTION_IF_NULL(debugger_);
|
||||||
// invalidate current data collected by the debugger
|
// invalidate current data collected by the debugger
|
||||||
debugger_->ClearCurrentData();
|
debugger_->ClearCurrentData();
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
#ifdef ENABLE_DUMP_IR
|
#ifdef ENABLE_DUMP_IR
|
||||||
|
@ -778,18 +792,21 @@ bool GPUKernelRuntime::LaunchKernelDynamic(const session::KernelGraph *graph, bo
|
||||||
if (gpu_kernel != nullptr && dynamic_kernel != nullptr && dynamic_kernel->is_dynamic_shape()) {
|
if (gpu_kernel != nullptr && dynamic_kernel != nullptr && dynamic_kernel->is_dynamic_shape()) {
|
||||||
gpu_kernel->PostExecute();
|
gpu_kernel->PostExecute();
|
||||||
}
|
}
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
// called once per kernel to collect the outputs to the kernel (does a SyncDeviceToHost)
|
// called once per kernel to collect the outputs to the kernel (does a SyncDeviceToHost)
|
||||||
LoadKernelData(debugger_.get(), kernel, kernel_inputs, kernel_workspaces, kernel_outputs, exec_order, stream_,
|
LoadKernelData(debugger_.get(), kernel, kernel_inputs, kernel_workspaces, kernel_outputs, exec_order, stream_,
|
||||||
dump_enabled, kernel == last_kernel);
|
dump_enabled, kernel == last_kernel);
|
||||||
|
#endif
|
||||||
}
|
}
|
||||||
exec_order = exec_order + 1;
|
exec_order = exec_order + 1;
|
||||||
FreeKernelDynamicRes(kernel);
|
FreeKernelDynamicRes(kernel);
|
||||||
if (!UpdateMemorySwapTask(kernel, mock, profiling)) {
|
if (!UpdateMemorySwapTask(kernel, mock, profiling)) {
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
if (!mock) {
|
if (!mock) {
|
||||||
// invalidate current data collected by the debugger
|
// invalidate current data collected by the debugger
|
||||||
debugger_->ClearCurrentData();
|
debugger_->ClearCurrentData();
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -190,6 +190,7 @@ void KernelRuntime::RunOpClearMemory(const session::KernelGraph *graph) const {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
bool KernelRuntime::DumpDataEnabled() {
|
bool KernelRuntime::DumpDataEnabled() {
|
||||||
auto &dump_json_parser = DumpJsonParser::GetInstance();
|
auto &dump_json_parser = DumpJsonParser::GetInstance();
|
||||||
return dump_json_parser.e2e_dump_enabled();
|
return dump_json_parser.e2e_dump_enabled();
|
||||||
|
@ -207,6 +208,7 @@ bool KernelRuntime::DumpDataEnabledIteration() {
|
||||||
}
|
}
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
void KernelRuntime::AssignStaticMemory(session::KernelGraph *graph) {
|
void KernelRuntime::AssignStaticMemory(session::KernelGraph *graph) {
|
||||||
AssignStaticMemoryInput(graph);
|
AssignStaticMemoryInput(graph);
|
||||||
|
|
|
@ -59,8 +59,10 @@ class KernelRuntime {
|
||||||
const std::map<tensor::TensorPtr, session::KernelWithIndex> &tensor_to_node = {});
|
const std::map<tensor::TensorPtr, session::KernelWithIndex> &tensor_to_node = {});
|
||||||
void RunOpClearMemory(const session::KernelGraph *graph) const;
|
void RunOpClearMemory(const session::KernelGraph *graph) const;
|
||||||
void RunOpMallocPre(const session::KernelGraph &graph, const std::vector<tensor::TensorPtr> &input_tensors);
|
void RunOpMallocPre(const session::KernelGraph &graph, const std::vector<tensor::TensorPtr> &input_tensors);
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
static bool DumpDataEnabled();
|
static bool DumpDataEnabled();
|
||||||
static bool DumpDataEnabledIteration();
|
static bool DumpDataEnabledIteration();
|
||||||
|
#endif
|
||||||
virtual bool LoadData(session::KernelGraph *graph);
|
virtual bool LoadData(session::KernelGraph *graph);
|
||||||
virtual bool Load(session::KernelGraph *graph, bool is_task_sink);
|
virtual bool Load(session::KernelGraph *graph, bool is_task_sink);
|
||||||
virtual bool Run(session::KernelGraph *graph, bool is_task_sink) = 0;
|
virtual bool Run(session::KernelGraph *graph, bool is_task_sink) = 0;
|
||||||
|
@ -92,12 +94,14 @@ class KernelRuntime {
|
||||||
void set_device_id(uint32_t device_id) { device_id_ = device_id; }
|
void set_device_id(uint32_t device_id) { device_id_ = device_id; }
|
||||||
uint32_t device_id() { return device_id_; }
|
uint32_t device_id() { return device_id_; }
|
||||||
|
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
// set debugger
|
// set debugger
|
||||||
void SetDebugger() {
|
void SetDebugger() {
|
||||||
#if !defined(_WIN32) && !defined(_WIN64)
|
#if !defined(_WIN32) && !defined(_WIN64)
|
||||||
debugger_ = Debugger::GetInstance();
|
debugger_ = Debugger::GetInstance();
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
#ifndef ENABLE_SECURITY
|
#ifndef ENABLE_SECURITY
|
||||||
virtual void PreInit() {}
|
virtual void PreInit() {}
|
||||||
|
@ -159,7 +163,7 @@ class KernelRuntime {
|
||||||
protected:
|
protected:
|
||||||
uint32_t device_id_{0};
|
uint32_t device_id_{0};
|
||||||
bool pynative_mode_profiling_flag_{false};
|
bool pynative_mode_profiling_flag_{false};
|
||||||
#if !defined(_WIN32) && !defined(_WIN64)
|
#if defined(ENABLE_DEBUGGER) && !defined(_WIN32) && !defined(_WIN64)
|
||||||
std::shared_ptr<Debugger> debugger_;
|
std::shared_ptr<Debugger> debugger_;
|
||||||
#endif
|
#endif
|
||||||
void *stream_{nullptr};
|
void *stream_{nullptr};
|
||||||
|
|
|
@ -21,7 +21,9 @@
|
||||||
#include "runtime/framework/actor/debug_aware_actor.h"
|
#include "runtime/framework/actor/debug_aware_actor.h"
|
||||||
#include "mindrt/include/async/async.h"
|
#include "mindrt/include/async/async.h"
|
||||||
#include "utils/log_adapter.h"
|
#include "utils/log_adapter.h"
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
#include "debug/data_dump/cpu_e2e_dump.h"
|
#include "debug/data_dump/cpu_e2e_dump.h"
|
||||||
|
#endif
|
||||||
#ifdef ENABLE_DEBUGGER
|
#ifdef ENABLE_DEBUGGER
|
||||||
#include "debug/debugger/debugger.h"
|
#include "debug/debugger/debugger.h"
|
||||||
#include "debug/debugger/debugger_utils.h"
|
#include "debug/debugger/debugger_utils.h"
|
||||||
|
@ -45,11 +47,13 @@ void DebugActor::Debug(const AnfNodePtr &node, const KernelLaunchInfo *launch_in
|
||||||
|
|
||||||
const auto &cnode = node->cast<CNodePtr>();
|
const auto &cnode = node->cast<CNodePtr>();
|
||||||
if (device_context->GetDeviceAddressType() == device::DeviceAddressType::kCPU) {
|
if (device_context->GetDeviceAddressType() == device::DeviceAddressType::kCPU) {
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
if (DumpJsonParser::GetInstance().GetIterDumpFlag()) {
|
if (DumpJsonParser::GetInstance().GetIterDumpFlag()) {
|
||||||
auto kernel_graph = std::dynamic_pointer_cast<session::KernelGraph>(cnode->func_graph());
|
auto kernel_graph = std::dynamic_pointer_cast<session::KernelGraph>(cnode->func_graph());
|
||||||
MS_EXCEPTION_IF_NULL(kernel_graph);
|
MS_EXCEPTION_IF_NULL(kernel_graph);
|
||||||
CPUE2eDump::DumpCNodeData(cnode, kernel_graph->graph_id());
|
CPUE2eDump::DumpCNodeData(cnode, kernel_graph->graph_id());
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
} else if (device_context->GetDeviceAddressType() == device::DeviceAddressType::kGPU) {
|
} else if (device_context->GetDeviceAddressType() == device::DeviceAddressType::kGPU) {
|
||||||
#ifdef ENABLE_DEBUGGER
|
#ifdef ENABLE_DEBUGGER
|
||||||
auto debugger = Debugger::GetInstance();
|
auto debugger = Debugger::GetInstance();
|
||||||
|
@ -73,9 +77,11 @@ void DebugActor::DebugOnStepEnd(OpContext<DeviceTensor> *const op_context, const
|
||||||
MS_EXCEPTION_IF_NULL(op_context);
|
MS_EXCEPTION_IF_NULL(op_context);
|
||||||
MS_EXCEPTION_IF_NULL(from_aid);
|
MS_EXCEPTION_IF_NULL(from_aid);
|
||||||
|
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
if (DumpJsonParser::GetInstance().GetIterDumpFlag()) {
|
if (DumpJsonParser::GetInstance().GetIterDumpFlag()) {
|
||||||
CPUE2eDump::DumpParametersAndConst();
|
CPUE2eDump::DumpParametersAndConst();
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
#ifdef ENABLE_DEBUGGER
|
#ifdef ENABLE_DEBUGGER
|
||||||
auto debugger = Debugger::GetInstance();
|
auto debugger = Debugger::GetInstance();
|
||||||
|
@ -86,7 +92,9 @@ void DebugActor::DebugOnStepEnd(OpContext<DeviceTensor> *const op_context, const
|
||||||
debugger->Debugger::PostExecuteGraphDebugger();
|
debugger->Debugger::PostExecuteGraphDebugger();
|
||||||
}
|
}
|
||||||
#else
|
#else
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
DumpJsonParser::GetInstance().UpdateDumpIter();
|
DumpJsonParser::GetInstance().UpdateDumpIter();
|
||||||
|
#endif
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
// Call back to the from actor to process after debug finished.
|
// Call back to the from actor to process after debug finished.
|
||||||
|
|
|
@ -41,7 +41,9 @@
|
||||||
#include "debug/rdr/running_data_recorder.h"
|
#include "debug/rdr/running_data_recorder.h"
|
||||||
#endif
|
#endif
|
||||||
#include "utils/comm_manager.h"
|
#include "utils/comm_manager.h"
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
#include "debug/debugger/debugger.h"
|
#include "debug/debugger/debugger.h"
|
||||||
|
#endif
|
||||||
#include "backend/optimizer/pass/optimize_updatestate.h"
|
#include "backend/optimizer/pass/optimize_updatestate.h"
|
||||||
|
|
||||||
namespace mindspore {
|
namespace mindspore {
|
||||||
|
@ -95,13 +97,14 @@ void GPUDeviceContext::Initialize() {
|
||||||
(*init_nccl_comm_funcptr)();
|
(*init_nccl_comm_funcptr)();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
// Dump json config file if dump is enabled.
|
// Dump json config file if dump is enabled.
|
||||||
auto rank_id = GetRankID();
|
auto rank_id = GetRankID();
|
||||||
auto &json_parser = DumpJsonParser::GetInstance();
|
auto &json_parser = DumpJsonParser::GetInstance();
|
||||||
json_parser.Parse();
|
json_parser.Parse();
|
||||||
json_parser.CopyJsonToDir(rank_id);
|
json_parser.CopyJsonToDir(rank_id);
|
||||||
json_parser.CopyMSCfgJsonToDir(rank_id);
|
json_parser.CopyMSCfgJsonToDir(rank_id);
|
||||||
|
#endif
|
||||||
initialized_ = true;
|
initialized_ = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -135,11 +138,13 @@ bool GPUDeviceContext::InitDevice() {
|
||||||
|
|
||||||
void GPUDeviceContext::Destroy() {
|
void GPUDeviceContext::Destroy() {
|
||||||
// Release GPU buffer manager resource
|
// Release GPU buffer manager resource
|
||||||
|
#ifdef ENABLE_DEBUGGER
|
||||||
auto debugger = Debugger::GetInstance();
|
auto debugger = Debugger::GetInstance();
|
||||||
if (debugger && debugger->debugger_enabled()) {
|
if (debugger && debugger->debugger_enabled()) {
|
||||||
debugger->SetTrainingDone(true);
|
debugger->SetTrainingDone(true);
|
||||||
debugger->SendMetadata(false);
|
debugger->SendMetadata(false);
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
if (GpuBufferMgr::GetInstance().IsInit()) {
|
if (GpuBufferMgr::GetInstance().IsInit()) {
|
||||||
if (!GpuBufferMgr::GetInstance().IsClosed() && !GpuBufferMgr::GetInstance().CloseNotify()) {
|
if (!GpuBufferMgr::GetInstance().IsClosed() && !GpuBufferMgr::GetInstance().CloseNotify()) {
|
||||||
|
|
|
@ -39,7 +39,9 @@
|
||||||
#ifdef ENABLE_DEBUGGER
|
#ifdef ENABLE_DEBUGGER
|
||||||
#include "debug/debugger/debugger.h"
|
#include "debug/debugger/debugger.h"
|
||||||
#endif
|
#endif
|
||||||
|
#ifndef ENABLE_SECURITY
|
||||||
#include "debug/data_dump/dump_json_parser.h"
|
#include "debug/data_dump/dump_json_parser.h"
|
||||||
|
#endif
|
||||||
#ifdef ENABLE_DUMP_IR
|
#ifdef ENABLE_DUMP_IR
|
||||||
#include "debug/rdr/running_data_recorder.h"
|
#include "debug/rdr/running_data_recorder.h"
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -16,6 +16,11 @@ This module provides APIs to load and process dump data, i.e. read tensors, chec
|
||||||
for watchpoints and other debugging services.
|
for watchpoints and other debugging services.
|
||||||
"""
|
"""
|
||||||
|
|
||||||
|
from mindspore._c_expression import security
|
||||||
from . import dbg_services
|
from . import dbg_services
|
||||||
from . import mi_validator_helpers
|
from . import mi_validator_helpers
|
||||||
from . import mi_validators
|
from . import mi_validators
|
||||||
|
|
||||||
|
if security.enable_security():
|
||||||
|
raise ModuleNotFoundError("Offline debugger is not supported in security mode."\
|
||||||
|
"Please recompile mindspore without `-s on`.")
|
||||||
|
|
|
@ -16,6 +16,7 @@
|
||||||
The module DbgServices provides offline debugger APIs.
|
The module DbgServices provides offline debugger APIs.
|
||||||
"""
|
"""
|
||||||
|
|
||||||
|
from mindspore._c_expression import security
|
||||||
import mindspore._mindspore_offline_debug as cds
|
import mindspore._mindspore_offline_debug as cds
|
||||||
from mindspore.offline_debug.mi_validators import check_init, check_initialize, check_add_watchpoint,\
|
from mindspore.offline_debug.mi_validators import check_init, check_initialize, check_add_watchpoint,\
|
||||||
check_remove_watchpoint, check_check_watchpoints, check_read_tensor_info, check_initialize_done, \
|
check_remove_watchpoint, check_check_watchpoints, check_read_tensor_info, check_initialize_done, \
|
||||||
|
@ -35,6 +36,9 @@ def get_version():
|
||||||
>>> from mindspore.ccsrc.debug.debugger.offline_debug import dbg_services
|
>>> from mindspore.ccsrc.debug.debugger.offline_debug import dbg_services
|
||||||
>>> version = dbg_services.get_version()
|
>>> version = dbg_services.get_version()
|
||||||
"""
|
"""
|
||||||
|
if security.enable_security():
|
||||||
|
raise ValueError("Offline debugger is not supported in security mode. " \
|
||||||
|
"Please recompile mindspore without `-s on`.")
|
||||||
return cds.DbgServices(False).GetVersion()
|
return cds.DbgServices(False).GetVersion()
|
||||||
|
|
||||||
class DbgLogger:
|
class DbgLogger:
|
||||||
|
@ -75,6 +79,9 @@ class DbgServices():
|
||||||
|
|
||||||
@check_init
|
@check_init
|
||||||
def __init__(self, dump_file_path, verbose=False):
|
def __init__(self, dump_file_path, verbose=False):
|
||||||
|
if security.enable_security():
|
||||||
|
raise ValueError("Offline debugger is not supported in security mode. "\
|
||||||
|
"Please recompile mindspore without `-s on`.")
|
||||||
log.verbose = verbose
|
log.verbose = verbose
|
||||||
log("in Python __init__, file path is ", dump_file_path)
|
log("in Python __init__, file path is ", dump_file_path)
|
||||||
self.dump_file_path = dump_file_path
|
self.dump_file_path = dump_file_path
|
||||||
|
@ -382,6 +389,9 @@ class TensorInfo():
|
||||||
|
|
||||||
@check_tensor_info_init
|
@check_tensor_info_init
|
||||||
def __init__(self, node_name, slot, iteration, rank_id, root_graph_id, is_output=True):
|
def __init__(self, node_name, slot, iteration, rank_id, root_graph_id, is_output=True):
|
||||||
|
if security.enable_security():
|
||||||
|
raise ValueError("Offline debugger is not supported in security mode. " \
|
||||||
|
"Please recompile mindspore without `-s on`.")
|
||||||
iteration = replace_minus_one(iteration)
|
iteration = replace_minus_one(iteration)
|
||||||
self.instance = cds.tensor_info(node_name, slot, iteration, rank_id, root_graph_id, is_output)
|
self.instance = cds.tensor_info(node_name, slot, iteration, rank_id, root_graph_id, is_output)
|
||||||
|
|
||||||
|
@ -531,6 +541,9 @@ class TensorData():
|
||||||
|
|
||||||
@check_tensor_data_init
|
@check_tensor_data_init
|
||||||
def __init__(self, data_ptr, data_size, dtype, shape):
|
def __init__(self, data_ptr, data_size, dtype, shape):
|
||||||
|
if security.enable_security():
|
||||||
|
raise ValueError("Offline debugger is not supported in security mode." \
|
||||||
|
"Please recompile mindspore without `-s on`.")
|
||||||
self.instance = cds.tensor_data(data_ptr, data_size, dtype, shape)
|
self.instance = cds.tensor_data(data_ptr, data_size, dtype, shape)
|
||||||
|
|
||||||
@property
|
@property
|
||||||
|
@ -627,6 +640,9 @@ class TensorBaseData():
|
||||||
"""
|
"""
|
||||||
@check_tensor_base_data_init
|
@check_tensor_base_data_init
|
||||||
def __init__(self, data_size, dtype, shape):
|
def __init__(self, data_size, dtype, shape):
|
||||||
|
if security.enable_security():
|
||||||
|
raise ValueError("Offline debugger is not supported in security mode. " \
|
||||||
|
"Please recompile mindspore without `-s on`.")
|
||||||
self.instance = cds.TensorBaseData(data_size, dtype, shape)
|
self.instance = cds.TensorBaseData(data_size, dtype, shape)
|
||||||
|
|
||||||
def __str__(self):
|
def __str__(self):
|
||||||
|
@ -727,6 +743,9 @@ class TensorStatData():
|
||||||
@check_tensor_stat_data_init
|
@check_tensor_stat_data_init
|
||||||
def __init__(self, data_size, dtype, shape, is_bool, max_value, min_value, avg_value, count,
|
def __init__(self, data_size, dtype, shape, is_bool, max_value, min_value, avg_value, count,
|
||||||
neg_zero_count, pos_zero_count, nan_count, neg_inf_count, pos_inf_count, zero_count):
|
neg_zero_count, pos_zero_count, nan_count, neg_inf_count, pos_inf_count, zero_count):
|
||||||
|
if security.enable_security():
|
||||||
|
raise ValueError("Offline debugger is not supported in security mode. " \
|
||||||
|
"Please recompile mindspore without `-s on`.")
|
||||||
self.instance = cds.TensorStatData(data_size, dtype, shape, is_bool, max_value,
|
self.instance = cds.TensorStatData(data_size, dtype, shape, is_bool, max_value,
|
||||||
min_value, avg_value, count, neg_zero_count,
|
min_value, avg_value, count, neg_zero_count,
|
||||||
pos_zero_count, nan_count, neg_inf_count,
|
pos_zero_count, nan_count, neg_inf_count,
|
||||||
|
@ -1064,6 +1083,9 @@ class WatchpointHit():
|
||||||
|
|
||||||
@check_watchpoint_hit_init
|
@check_watchpoint_hit_init
|
||||||
def __init__(self, name, slot, condition, watchpoint_id, parameters, error_code, rank_id, root_graph_id):
|
def __init__(self, name, slot, condition, watchpoint_id, parameters, error_code, rank_id, root_graph_id):
|
||||||
|
if security.enable_security():
|
||||||
|
raise ValueError("Offline debugger is not supported in security mode. " \
|
||||||
|
"Please recompile mindspore without `-s on`.")
|
||||||
parameter_list_inst = []
|
parameter_list_inst = []
|
||||||
for elem in parameters:
|
for elem in parameters:
|
||||||
parameter_list_inst.append(elem.instance)
|
parameter_list_inst.append(elem.instance)
|
||||||
|
@ -1285,6 +1307,9 @@ class Parameter():
|
||||||
|
|
||||||
@check_parameter_init
|
@check_parameter_init
|
||||||
def __init__(self, name, disabled, value, hit=False, actual_value=0.0):
|
def __init__(self, name, disabled, value, hit=False, actual_value=0.0):
|
||||||
|
if security.enable_security():
|
||||||
|
raise ValueError("Offline debugger is not supported in security mode. " \
|
||||||
|
"Please recompile mindspore without `-s on`.")
|
||||||
self.instance = cds.parameter(name, disabled, value, hit, actual_value)
|
self.instance = cds.parameter(name, disabled, value, hit, actual_value)
|
||||||
|
|
||||||
@property
|
@property
|
||||||
|
|
|
@ -20,6 +20,7 @@ import mindspore.offline_debug.dbg_services as d
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import pytest
|
import pytest
|
||||||
from dump_test_utils import compare_actual_with_expected
|
from dump_test_utils import compare_actual_with_expected
|
||||||
|
from tests.security_utils import security_off_wrap
|
||||||
|
|
||||||
GENERATE_GOLDEN = False
|
GENERATE_GOLDEN = False
|
||||||
test_name = "async_sink_mode_true_read_tensors"
|
test_name = "async_sink_mode_true_read_tensors"
|
||||||
|
@ -30,6 +31,7 @@ test_name = "async_sink_mode_true_read_tensors"
|
||||||
@pytest.mark.platform_x86_ascend_training
|
@pytest.mark.platform_x86_ascend_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
@pytest.mark.skip(reason="needs updating")
|
@pytest.mark.skip(reason="needs updating")
|
||||||
|
@security_off_wrap
|
||||||
def test_async_sink_mode_true_read_tensors():
|
def test_async_sink_mode_true_read_tensors():
|
||||||
debugger_backend = d.DbgServices(
|
debugger_backend = d.DbgServices(
|
||||||
dump_file_path="/home/workspace/mindspore_dataset/dumps/async_sink_true/")
|
dump_file_path="/home/workspace/mindspore_dataset/dumps/async_sink_true/")
|
||||||
|
|
|
@ -19,6 +19,7 @@ Watchpoints test script for offline debugger APIs.
|
||||||
import mindspore.offline_debug.dbg_services as d
|
import mindspore.offline_debug.dbg_services as d
|
||||||
import pytest
|
import pytest
|
||||||
from dump_test_utils import compare_actual_with_expected
|
from dump_test_utils import compare_actual_with_expected
|
||||||
|
from tests.security_utils import security_off_wrap
|
||||||
|
|
||||||
GENERATE_GOLDEN = False
|
GENERATE_GOLDEN = False
|
||||||
test_name = "async_sink_mode_true_watchpoints"
|
test_name = "async_sink_mode_true_watchpoints"
|
||||||
|
@ -29,6 +30,7 @@ test_name = "async_sink_mode_true_watchpoints"
|
||||||
@pytest.mark.platform_x86_ascend_training
|
@pytest.mark.platform_x86_ascend_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
@pytest.mark.skip(reason="needs updating")
|
@pytest.mark.skip(reason="needs updating")
|
||||||
|
@security_off_wrap
|
||||||
def test_async_sink_mode_true_watchpoints():
|
def test_async_sink_mode_true_watchpoints():
|
||||||
if GENERATE_GOLDEN:
|
if GENERATE_GOLDEN:
|
||||||
f_write = open(test_name + ".expected", "w")
|
f_write = open(test_name + ".expected", "w")
|
||||||
|
|
|
@ -20,6 +20,7 @@ import mindspore.offline_debug.dbg_services as d
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import pytest
|
import pytest
|
||||||
from dump_test_utils import compare_actual_with_expected
|
from dump_test_utils import compare_actual_with_expected
|
||||||
|
from tests.security_utils import security_off_wrap
|
||||||
|
|
||||||
GENERATE_GOLDEN = False
|
GENERATE_GOLDEN = False
|
||||||
test_name = "sync_trans_false_read_tensors"
|
test_name = "sync_trans_false_read_tensors"
|
||||||
|
@ -30,6 +31,7 @@ test_name = "sync_trans_false_read_tensors"
|
||||||
@pytest.mark.platform_x86_ascend_training
|
@pytest.mark.platform_x86_ascend_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
@pytest.mark.skip(reason="needs updating")
|
@pytest.mark.skip(reason="needs updating")
|
||||||
|
@security_off_wrap
|
||||||
def test_sync_trans_false_read_tensors():
|
def test_sync_trans_false_read_tensors():
|
||||||
|
|
||||||
debugger_backend = d.DbgServices(
|
debugger_backend = d.DbgServices(
|
||||||
|
|
|
@ -19,6 +19,7 @@ Watchpoints test script for offline debugger APIs.
|
||||||
import mindspore.offline_debug.dbg_services as d
|
import mindspore.offline_debug.dbg_services as d
|
||||||
import pytest
|
import pytest
|
||||||
from dump_test_utils import compare_actual_with_expected
|
from dump_test_utils import compare_actual_with_expected
|
||||||
|
from tests.security_utils import security_off_wrap
|
||||||
|
|
||||||
GENERATE_GOLDEN = False
|
GENERATE_GOLDEN = False
|
||||||
test_name = "sync_trans_false_watchpoints"
|
test_name = "sync_trans_false_watchpoints"
|
||||||
|
@ -29,6 +30,7 @@ test_name = "sync_trans_false_watchpoints"
|
||||||
@pytest.mark.platform_x86_ascend_training
|
@pytest.mark.platform_x86_ascend_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
@pytest.mark.skip(reason="needs updating")
|
@pytest.mark.skip(reason="needs updating")
|
||||||
|
@security_off_wrap
|
||||||
def test_sync_trans_false_watchpoints():
|
def test_sync_trans_false_watchpoints():
|
||||||
|
|
||||||
if GENERATE_GOLDEN:
|
if GENERATE_GOLDEN:
|
||||||
|
|
|
@ -20,6 +20,7 @@ import mindspore.offline_debug.dbg_services as d
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import pytest
|
import pytest
|
||||||
from dump_test_utils import compare_actual_with_expected
|
from dump_test_utils import compare_actual_with_expected
|
||||||
|
from tests.security_utils import security_off_wrap
|
||||||
|
|
||||||
GENERATE_GOLDEN = False
|
GENERATE_GOLDEN = False
|
||||||
test_name = "sync_trans_true_read_tensors"
|
test_name = "sync_trans_true_read_tensors"
|
||||||
|
@ -30,6 +31,7 @@ test_name = "sync_trans_true_read_tensors"
|
||||||
@pytest.mark.platform_x86_ascend_training
|
@pytest.mark.platform_x86_ascend_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
@pytest.mark.skip(reason="needs updating")
|
@pytest.mark.skip(reason="needs updating")
|
||||||
|
@security_off_wrap
|
||||||
def test_sync_trans_true_read_tensors():
|
def test_sync_trans_true_read_tensors():
|
||||||
|
|
||||||
debugger_backend = d.DbgServices(
|
debugger_backend = d.DbgServices(
|
||||||
|
|
|
@ -33,6 +33,7 @@ from mindspore.nn import Momentum
|
||||||
from mindspore.nn import TrainOneStepCell
|
from mindspore.nn import TrainOneStepCell
|
||||||
from mindspore.nn import WithLossCell
|
from mindspore.nn import WithLossCell
|
||||||
from dump_test_utils import generate_dump_json
|
from dump_test_utils import generate_dump_json
|
||||||
|
from tests.security_utils import security_off_wrap
|
||||||
|
|
||||||
|
|
||||||
class Net(nn.Cell):
|
class Net(nn.Cell):
|
||||||
|
@ -52,6 +53,7 @@ y = np.array([[7, 8, 9], [10, 11, 12]]).astype(np.float32)
|
||||||
@pytest.mark.platform_arm_ascend_training
|
@pytest.mark.platform_arm_ascend_training
|
||||||
@pytest.mark.platform_x86_ascend_training
|
@pytest.mark.platform_x86_ascend_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
|
@security_off_wrap
|
||||||
def test_async_dump():
|
def test_async_dump():
|
||||||
context.set_context(mode=context.GRAPH_MODE, device_target="Ascend")
|
context.set_context(mode=context.GRAPH_MODE, device_target="Ascend")
|
||||||
pwd = os.getcwd()
|
pwd = os.getcwd()
|
||||||
|
@ -104,6 +106,7 @@ def run_e2e_dump():
|
||||||
@pytest.mark.platform_arm_ascend_training
|
@pytest.mark.platform_arm_ascend_training
|
||||||
@pytest.mark.platform_x86_ascend_training
|
@pytest.mark.platform_x86_ascend_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
|
@security_off_wrap
|
||||||
def test_e2e_dump():
|
def test_e2e_dump():
|
||||||
context.set_context(mode=context.GRAPH_MODE, device_target="Ascend")
|
context.set_context(mode=context.GRAPH_MODE, device_target="Ascend")
|
||||||
run_e2e_dump()
|
run_e2e_dump()
|
||||||
|
@ -113,6 +116,7 @@ def test_e2e_dump():
|
||||||
@pytest.mark.platform_arm_ascend_training
|
@pytest.mark.platform_arm_ascend_training
|
||||||
@pytest.mark.platform_x86_ascend_training
|
@pytest.mark.platform_x86_ascend_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
|
@security_off_wrap
|
||||||
def test_e2e_dump_with_hccl_env():
|
def test_e2e_dump_with_hccl_env():
|
||||||
context.set_context(mode=context.GRAPH_MODE, device_target="Ascend")
|
context.set_context(mode=context.GRAPH_MODE, device_target="Ascend")
|
||||||
os.environ["RANK_TABLE_FILE"] = "invalid_file.json"
|
os.environ["RANK_TABLE_FILE"] = "invalid_file.json"
|
||||||
|
@ -123,6 +127,7 @@ def test_e2e_dump_with_hccl_env():
|
||||||
@pytest.mark.level0
|
@pytest.mark.level0
|
||||||
@pytest.mark.platform_x86_cpu
|
@pytest.mark.platform_x86_cpu
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
|
@security_off_wrap
|
||||||
def test_cpu_e2e_dump():
|
def test_cpu_e2e_dump():
|
||||||
context.set_context(mode=context.GRAPH_MODE, device_target="CPU")
|
context.set_context(mode=context.GRAPH_MODE, device_target="CPU")
|
||||||
run_e2e_dump()
|
run_e2e_dump()
|
||||||
|
@ -131,6 +136,7 @@ def test_cpu_e2e_dump():
|
||||||
@pytest.mark.level0
|
@pytest.mark.level0
|
||||||
@pytest.mark.platform_x86_cpu
|
@pytest.mark.platform_x86_cpu
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
|
@security_off_wrap
|
||||||
def test_cpu_e2e_dump_with_hccl_set():
|
def test_cpu_e2e_dump_with_hccl_set():
|
||||||
context.set_context(mode=context.GRAPH_MODE, device_target="CPU")
|
context.set_context(mode=context.GRAPH_MODE, device_target="CPU")
|
||||||
os.environ["RANK_TABLE_FILE"] = "invalid_file.json"
|
os.environ["RANK_TABLE_FILE"] = "invalid_file.json"
|
||||||
|
@ -141,6 +147,7 @@ def test_cpu_e2e_dump_with_hccl_set():
|
||||||
@pytest.mark.level0
|
@pytest.mark.level0
|
||||||
@pytest.mark.platform_x86_gpu_training
|
@pytest.mark.platform_x86_gpu_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
|
@security_off_wrap
|
||||||
def test_gpu_e2e_dump():
|
def test_gpu_e2e_dump():
|
||||||
context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
|
context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
|
||||||
run_e2e_dump()
|
run_e2e_dump()
|
||||||
|
@ -149,6 +156,7 @@ def test_gpu_e2e_dump():
|
||||||
@pytest.mark.level0
|
@pytest.mark.level0
|
||||||
@pytest.mark.platform_x86_gpu_training
|
@pytest.mark.platform_x86_gpu_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
|
@security_off_wrap
|
||||||
def test_gpu_e2e_dump_with_hccl_set():
|
def test_gpu_e2e_dump_with_hccl_set():
|
||||||
context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
|
context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
|
||||||
os.environ["RANK_TABLE_FILE"] = "invalid_file.json"
|
os.environ["RANK_TABLE_FILE"] = "invalid_file.json"
|
||||||
|
@ -175,6 +183,7 @@ class ReluReduceMeanDenseRelu(Cell):
|
||||||
@pytest.mark.platform_arm_ascend_training
|
@pytest.mark.platform_arm_ascend_training
|
||||||
@pytest.mark.platform_x86_ascend_training
|
@pytest.mark.platform_x86_ascend_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
|
@security_off_wrap
|
||||||
def test_async_dump_net_multi_layer_mode1():
|
def test_async_dump_net_multi_layer_mode1():
|
||||||
context.set_context(mode=context.GRAPH_MODE, device_target="Ascend")
|
context.set_context(mode=context.GRAPH_MODE, device_target="Ascend")
|
||||||
pwd = os.getcwd()
|
pwd = os.getcwd()
|
||||||
|
@ -218,6 +227,7 @@ def test_async_dump_net_multi_layer_mode1():
|
||||||
@pytest.mark.platform_arm_ascend_training
|
@pytest.mark.platform_arm_ascend_training
|
||||||
@pytest.mark.platform_x86_ascend_training
|
@pytest.mark.platform_x86_ascend_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
|
@security_off_wrap
|
||||||
def test_dump_with_diagnostic_path():
|
def test_dump_with_diagnostic_path():
|
||||||
"""
|
"""
|
||||||
Test e2e dump when path is not set (set to empty) in dump json file and MS_DIAGNOSTIC_DATA_PATH is set.
|
Test e2e dump when path is not set (set to empty) in dump json file and MS_DIAGNOSTIC_DATA_PATH is set.
|
||||||
|
@ -260,6 +270,7 @@ def run_e2e_dump_execution_graph():
|
||||||
@pytest.mark.level0
|
@pytest.mark.level0
|
||||||
@pytest.mark.platform_x86_gpu_training
|
@pytest.mark.platform_x86_gpu_training
|
||||||
@pytest.mark.env_onecard
|
@pytest.mark.env_onecard
|
||||||
|
@security_off_wrap
|
||||||
def test_dump_with_execution_graph():
|
def test_dump_with_execution_graph():
|
||||||
"""Test dump with execution graph on GPU."""
|
"""Test dump with execution graph on GPU."""
|
||||||
context.set_context(mode=context.GRAPH_MODE, device_target='GPU')
|
context.set_context(mode=context.GRAPH_MODE, device_target='GPU')
|
||||||
|
|
|
@ -20,11 +20,13 @@ import shutil
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import mindspore.offline_debug.dbg_services as d
|
import mindspore.offline_debug.dbg_services as d
|
||||||
from dump_test_utils import compare_actual_with_expected, build_dump_structure
|
from dump_test_utils import compare_actual_with_expected, build_dump_structure
|
||||||
|
from tests.security_utils import security_off_wrap
|
||||||
|
|
||||||
GENERATE_GOLDEN = False
|
GENERATE_GOLDEN = False
|
||||||
test_name = "sync_read_tensors"
|
test_name = "sync_read_tensors"
|
||||||
|
|
||||||
|
|
||||||
|
@security_off_wrap
|
||||||
def test_sync_trans_false_read_tensors():
|
def test_sync_trans_false_read_tensors():
|
||||||
|
|
||||||
# input tensor with zero slot
|
# input tensor with zero slot
|
||||||
|
|
|
@ -19,11 +19,13 @@ import shutil
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import mindspore.offline_debug.dbg_services as d
|
import mindspore.offline_debug.dbg_services as d
|
||||||
from dump_test_utils import compare_actual_with_expected, build_dump_structure
|
from dump_test_utils import compare_actual_with_expected, build_dump_structure
|
||||||
|
from tests.security_utils import security_off_wrap
|
||||||
|
|
||||||
GENERATE_GOLDEN = False
|
GENERATE_GOLDEN = False
|
||||||
test_name = "sync_read_tensors_base_stat"
|
test_name = "sync_read_tensors_base_stat"
|
||||||
|
|
||||||
|
|
||||||
|
@security_off_wrap
|
||||||
def test_sync_read_tensors_base_stat():
|
def test_sync_read_tensors_base_stat():
|
||||||
|
|
||||||
value_tensor = np.array([[7.5, 8.56, -9.78], [10.0, -11.0, 0.0]], np.float32)
|
value_tensor = np.array([[7.5, 8.56, -9.78], [10.0, -11.0, 0.0]], np.float32)
|
||||||
|
|
|
@ -20,11 +20,13 @@ import shutil
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import mindspore.offline_debug.dbg_services as d
|
import mindspore.offline_debug.dbg_services as d
|
||||||
from dump_test_utils import compare_actual_with_expected, build_dump_structure
|
from dump_test_utils import compare_actual_with_expected, build_dump_structure
|
||||||
|
from tests.security_utils import security_off_wrap
|
||||||
|
|
||||||
GENERATE_GOLDEN = False
|
GENERATE_GOLDEN = False
|
||||||
test_name = "sync_read_tensors_nonexist_node"
|
test_name = "sync_read_tensors_nonexist_node"
|
||||||
|
|
||||||
|
|
||||||
|
@security_off_wrap
|
||||||
def test_sync_trans_read_tensors_nonexist_node():
|
def test_sync_trans_read_tensors_nonexist_node():
|
||||||
|
|
||||||
tensor1 = np.array([32.0, 4096.0], np.float32)
|
tensor1 = np.array([32.0, 4096.0], np.float32)
|
||||||
|
|
|
@ -20,11 +20,13 @@ import shutil
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import mindspore.offline_debug.dbg_services as d
|
import mindspore.offline_debug.dbg_services as d
|
||||||
from dump_test_utils import compare_actual_with_expected, build_dump_structure
|
from dump_test_utils import compare_actual_with_expected, build_dump_structure
|
||||||
|
from tests.security_utils import security_off_wrap
|
||||||
|
|
||||||
GENERATE_GOLDEN = False
|
GENERATE_GOLDEN = False
|
||||||
test_name = "sync_watchpoints"
|
test_name = "sync_watchpoints"
|
||||||
|
|
||||||
|
|
||||||
|
@security_off_wrap
|
||||||
def test_sync_trans_false_watchpoints():
|
def test_sync_trans_false_watchpoints():
|
||||||
|
|
||||||
if GENERATE_GOLDEN:
|
if GENERATE_GOLDEN:
|
||||||
|
|
Loading…
Reference in New Issue