onnxruntime/onnxruntime/test/framework/allocation_planner_test.cc
Dmitri Smirnov d1b1cdc5c4
Replace GSL with GSL-LITE submodule and fix up refs (#1920)
Remove gsl subodule and replace with a local copy of gsl-lite
  Refactor for onnxruntime::make_unique
  gsl::span size and index are now size_t
  Remove lambda auto argument type detection.
  Remove constexpr from fail_fast in gsl due to Linux not being happy.
  Comment out std::stream support due to MacOS std lib broken.
  Move make_unique into include/core/common so it is accessible for server builds.
  Relax requirements for onnxruntime/test/providers/cpu/ml/write_scores_test.cc
  due to x86 build.
  Add ONNXRUNTIME_ROOT to Server Lib includes so gsl is recognized
2019-10-01 12:43:29 -07:00

445 lines
16 KiB
C++

// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT License.
#include <string>
#include <unordered_map>
#include <unordered_set>
#include <sstream>
#include "core/framework/session_state.h"
#include "core/graph/model.h"
#include "gtest/gtest.h"
#include "core/framework/op_kernel.h"
#include "test/framework/model_builder_utils.h"
#include "core/framework/allocation_planner.h"
#include "core/providers/cpu/cpu_execution_provider.h"
using namespace ONNX_NAMESPACE;
namespace onnxruntime {
namespace test {
namespace modelbuilder {
class NodeCounter {
private:
static int node_count_;
public:
static int Next() { return ++node_count_; }
};
int NodeCounter::node_count_ = 0;
struct UnaryNode {
std::vector<onnxruntime::NodeArg*> input_args;
std::vector<onnxruntime::NodeArg*> output_args;
onnxruntime::Node* p_node;
UnaryNode(onnxruntime::Graph& graph, const std::string& op, onnxruntime::NodeArg* p_input_arg,
onnxruntime::NodeArg* p_output_arg)
: input_args({p_input_arg}), output_args({p_output_arg}) {
int num = NodeCounter::Next();
p_node = &graph.AddNode("node" + std::to_string(num), op, "test op", input_args, output_args);
}
UnaryNode(onnxruntime::Graph& graph, onnxruntime::NodeArg* p_input_arg, onnxruntime::NodeArg* p_output_arg)
: UnaryNode(graph, "Transpose", p_input_arg, p_output_arg) {}
};
class DummyOpKernel : public OpKernel {
public:
DummyOpKernel(const OpKernelInfo& p) : OpKernel(p) {}
Status Compute(OpKernelContext* context) const {
ORT_UNUSED_PARAMETER(context);
return Status::OK();
}
Status ComputeAsync(OpKernelContext* context, DoneCallback done) const {
ORT_UNUSED_PARAMETER(context);
ORT_UNUSED_PARAMETER(done);
return Status::OK();
}
};
} // namespace modelbuilder
using namespace modelbuilder;
class AllocationPlanTestUtility {
public:
static void CheckAllocationKind(const SequentialExecutionPlan& plan, std::vector<AllocKind>& expected) {
ASSERT_EQ(plan.allocation_plan.size(), expected.size()) << "Allocation plan of wrong size";
for (size_t i = 0; i < expected.size(); ++i) {
EXPECT_EQ(plan.allocation_plan[i].alloc_kind, expected[i]) << "Error in allocation kind at position " << i;
}
}
static void CheckToBeFreed(const SequentialExecutionPlan& plan, const std::vector<OrtValueIndex>& expected) {
ASSERT_EQ(plan.to_be_freed.size(), expected.size()) << "Allocation plan's to_be_freed of wrong size";
for (size_t i = 0; i < expected.size(); ++i) {
EXPECT_EQ(plan.to_be_freed[i], expected[i]) << "Error in to_be_freed at position " << i;
}
}
static void CheckFreedAtEachStep(const SequentialExecutionPlan& plan, const std::vector<int>& expected_num_freed) {
ASSERT_EQ(plan.execution_plan.size(), expected_num_freed.size()) << "Execution plan is of wrong size";
int start = 0;
for (size_t i = 0; i < expected_num_freed.size(); ++i) {
if (expected_num_freed[i] > 0) {
EXPECT_EQ(plan.execution_plan[i].free_from_index, start) << "Error in free_from_index at position " << i;
EXPECT_EQ(plan.execution_plan[i].free_to_index, start + expected_num_freed[i] - 1)
<< "Error in free_to_index at position " << i;
start = start + expected_num_freed[i];
} else {
// "free_from_index > free_to_index" indicates nothing is to be freed
EXPECT_GT(plan.execution_plan[i].free_from_index, plan.execution_plan[i].free_to_index);
}
}
}
static void BasicIntegrityCheck(const SequentialExecutionPlan& plan, size_t num_ml_values) {
// Sanity checks for plan.to_be_freed
std::unordered_set<OrtValueIndex> freed;
for (OrtValueIndex index : plan.to_be_freed) {
// Every index should be in the valid range [0, num_ml_values-1]
EXPECT_GE(index, 0);
EXPECT_LT(index, num_ml_values);
// An index should not be freed more than once
EXPECT_EQ(freed.count(index), 0) << "OrtValue " << index << " freed multiple times";
freed.insert(index);
}
// Check the free-index information for every execution step: they should cover the
// range [0, plan.to_be_freed.size()-1] properly.
int next_free_index = 0;
int max_free_index = ((int)plan.to_be_freed.size()) - 1;
for (const SequentialExecutionPlan::NodeExecutionPlan& step : plan.execution_plan) {
if (step.free_from_index <= step.free_to_index) {
EXPECT_EQ(step.free_from_index, next_free_index);
EXPECT_LE(step.free_to_index, max_free_index);
next_free_index = step.free_to_index + 1;
} // else nothing needs to be freed in this step
}
}
};
typedef std::unordered_map<const onnxruntime::NodeArg*, TensorShapeProto*> ShapeMap;
class SequentialPlannerTestContext : public ISequentialPlannerContext {
public:
SequentialPlannerTestContext(ShapeMap* shape_map) : shape_map_(shape_map) {}
TensorShapeProto* GetShape(const onnxruntime::NodeArg& arg) const override {
auto iter = shape_map_->find(&arg);
return (shape_map_->end() != iter) ? iter->second : nullptr;
}
private:
ShapeMap* shape_map_;
};
class PlannerTest : public ::testing::Test {
private:
void index(const std::string& name, int& out) {
ASSERT_TRUE(state_.GetOrtValueNameIdxMap().GetIdx(name, out).IsOK());
}
onnxruntime::Model model_;
onnxruntime::Graph& graph_;
// some standard components used to build test-cases:
Type float_type_;
std::unique_ptr<::onnxruntime::KernelDef> std_kernel_; // a unary kernel with no-aliasing and no-in-place
std::unique_ptr<::onnxruntime::KernelDef> in_place_kernel_; // a unary kernel with in-place
std::unordered_map<std::string, onnxruntime::NodeArg*> name_to_arg_;
std::vector<std::unique_ptr<UnaryNode>> nodes_;
std::vector<std::unique_ptr<OpKernelInfo>> op_kernel_infos_;
std::vector<std::pair<onnxruntime::Node*, KernelDef&>> kernel_bindings_;
ExecutionProviders execution_providers_;
concurrency::ThreadPool tp_;
SessionState state_;
ShapeMap shape_map_;
std::unique_ptr<SequentialExecutionPlan> plan_;
public:
PlannerTest()
: model_("test"), graph_(model_.MainGraph()), tp_("test", 1), state_(execution_providers_, false, &tp_, nullptr) {
std_kernel_ = KernelDefBuilder().SetName("Transpose").Provider(kCpuExecutionProvider).SinceVersion(1, 10).Build();
in_place_kernel_ =
KernelDefBuilder().SetName("Relu").Provider(kCpuExecutionProvider).SinceVersion(1, 10).MayInplace(0, 0).Build();
CPUExecutionProviderInfo epi;
auto execution_provider = onnxruntime::make_unique<CPUExecutionProvider>(epi);
execution_providers_.Add("CPUExecutionProvider", std::move(execution_provider));
}
~PlannerTest() = default;
onnxruntime::NodeArg* Arg(const std::string& name) {
auto iter = name_to_arg_.find(name);
if (name_to_arg_.end() != iter) return iter->second;
return (name_to_arg_[name] = &graph_.GetOrCreateNodeArg(name, &float_type_.value));
}
onnxruntime::Node* AddNode(::onnxruntime::KernelDef& kernel_def, std::string& input, std::string& output) {
auto node = onnxruntime::make_unique<UnaryNode>(graph_, kernel_def.OpName(), Arg(input), Arg(output));
auto* p_node = node->p_node;
p_node->SetExecutionProviderType(onnxruntime::kCpuExecutionProvider);
nodes_.push_back(std::move(node));
kernel_bindings_.emplace_back(p_node, kernel_def);
return p_node;
}
onnxruntime::Node* AddNormalNode(std::string& input, std::string& output) {
return AddNode(*std_kernel_, input, output);
}
onnxruntime::Node* AddInplaceNode(std::string& input, std::string& output) {
return AddNode(*in_place_kernel_, input, output);
}
void BindKernel(onnxruntime::Node* p_node, ::onnxruntime::KernelDef& kernel_def, KernelRegistry* reg) {
auto info = onnxruntime::make_unique<OpKernelInfo>(*p_node, kernel_def, *execution_providers_.Get(*p_node),
state_.GetInitializedTensors(), state_.GetOrtValueNameIdxMap(),
state_.GetFuncMgr(), state_.GetDataTransferMgr());
op_kernel_infos_.push_back(std::move(info));
if (reg->TryFindKernel(*p_node, onnxruntime::kCpuExecutionProvider) == nullptr) {
auto st = reg->Register(
KernelCreateInfo(onnxruntime::make_unique<KernelDef>(kernel_def),
[](const OpKernelInfo& info) -> OpKernel* { return new DummyOpKernel(info); }));
ORT_ENFORCE(st.IsOK(), st.ErrorMessage());
}
}
void SetShape(std::string& name, TensorShapeProto* shape) { shape_map_[Arg(name)] = shape; }
void SetShape(std::initializer_list<std::pair<std::string&, TensorShapeProto*>> shapes) {
for (auto& pair : shapes) {
SetShape(pair.first, pair.second);
}
}
void CreatePlan(const std::vector<const NodeArg*>& outer_scope_node_args = {}) {
EXPECT_EQ(graph_.Resolve(), Status::OK());
state_.SetGraph(graph_);
std::shared_ptr<KernelRegistry> reg = std::make_shared<KernelRegistry>();
for (auto& binding : kernel_bindings_) {
BindKernel(binding.first, binding.second, reg.get());
}
auto cpu_execution_provider = onnxruntime::make_unique<CPUExecutionProvider>(CPUExecutionProviderInfo());
KernelRegistryManager kernel_registry_manager;
kernel_registry_manager.RegisterKernelRegistry(reg);
ExecutionProviders execution_providers;
execution_providers.Add(onnxruntime::kCpuExecutionProvider, std::move(cpu_execution_provider));
auto status = kernel_registry_manager.RegisterKernels(execution_providers);
EXPECT_TRUE(status.IsOK()) << status.ErrorMessage();
status = state_.CreateKernels(kernel_registry_manager);
EXPECT_TRUE(status.IsOK()) << status.ErrorMessage();
SequentialPlannerTestContext test_context(&shape_map_);
status = SequentialPlanner::CreatePlan(nullptr, GraphViewer(graph_), outer_scope_node_args, execution_providers,
kernel_registry_manager, state_.GetOrtValueNameIdxMap(), test_context, plan_);
EXPECT_TRUE(status.IsOK()) << status.ErrorMessage();
AllocationPlanTestUtility::BasicIntegrityCheck(*plan_, name_to_arg_.size());
}
void CheckAllocKind(const std::string& name, AllocKind kind) {
int id;
index(name, id);
EXPECT_EQ(plan_->allocation_plan[id].alloc_kind, kind) << "Error in allocation kind for " << name;
}
void CheckFreed(int step_number, std::initializer_list<std::string> freed_items) {
// create set and check equality
std::unordered_set<int> expected;
for (auto& name : freed_items) {
int id;
index(name, id);
expected.insert(id);
}
std::unordered_set<int> plan_result;
auto& step_plan = plan_->execution_plan[step_number];
for (int i = step_plan.free_from_index; i <= step_plan.free_to_index; ++i)
plan_result.insert(plan_->to_be_freed[i]);
EXPECT_EQ(plan_result, expected) << "Freed items incorrect for step " << step_number;
}
protected:
Graph& GetGraph() { return graph_; }
const SequentialExecutionPlan& GetPlan() const { return *plan_; }
const SessionState& GetState() const { return state_; }
};
TEST_F(PlannerTest, ChainTest) {
// tensor variables:
std::string W("W"), X("X"), B("B"), Y("Y"), Z("Z");
// graph structure:
ONNX_NAMESPACE::TensorProto tensor;
tensor.add_dims(1);
tensor.add_float_data(1.0f);
tensor.set_data_type(TensorProto_DataType_FLOAT);
tensor.set_name("W");
GetGraph().AddInitializedTensor(tensor);
AddNormalNode(W, X);
AddNormalNode(X, B);
AddNormalNode(B, Y);
AddNormalNode(Y, Z);
// simulate shape-inference results:
Shape shape1{50, 100};
auto shape = &shape1.value;
SetShape({{X, shape}, {B, shape}, {Y, shape}, {Z, shape}});
CreatePlan();
// Expected plan:
// W: kAllocateStatically; X: kAllocate; B: kAllocate; Y: kReuse (X); post-node3: free(B); X is returned output
CheckAllocKind(W, AllocKind::kAllocateStatically);
CheckAllocKind(X, AllocKind::kAllocate);
CheckAllocKind(B, AllocKind::kAllocate);
CheckAllocKind(Y, AllocKind::kReuse);
CheckAllocKind(Z, AllocKind::kAllocateOutput);
CheckFreed(0, {});
CheckFreed(1, {});
CheckFreed(2, {"B"});
CheckFreed(3, {"X"});
}
/* InputOutputTest: Test that:
(a) All inputs are classified as kPreExisting,
(b) All outer scope node args are classified as kPreExisting,
(c) All outputs are classified as kAllocate (in this example),
(d) Neither input nor outputs are freed.
*/
TEST_F(PlannerTest, InputOutputTest) {
// tensor variables:
std::string X1("X1"), X2("X2"), Y1("Y1"), Y2("Y2"), Outer1("Outer1"), Y3("Y3");
// graph structure:
AddNormalNode(X1, Y1);
AddNormalNode(X2, Y2);
// add node that consumes an outer scope node arg
auto outer_node = AddNormalNode(Outer1, Y3);
const NodeArg* outer_scope_node_arg = outer_node->InputDefs().at(0);
GetGraph().AddOuterScopeNodeArg(Outer1);
// simulate no shape-inference:
CreatePlan({outer_scope_node_arg});
// X1: kPreExisting, X2: kPreExisting, Outer1: kPreExisting, Y1: kAllocate, Y2: kAllocate, Y3: kAllocate
CheckAllocKind(X1, AllocKind::kPreExisting);
CheckAllocKind(X2, AllocKind::kPreExisting);
CheckAllocKind(Outer1, AllocKind::kPreExisting);
CheckAllocKind(Y1, AllocKind::kAllocateOutput);
CheckAllocKind(Y2, AllocKind::kAllocateOutput);
CheckAllocKind(Y3, AllocKind::kAllocateOutput);
// Nothing should be freed (since they are either inputs or outputs)
CheckFreed(0, {});
CheckFreed(1, {});
CheckFreed(2, {});
}
// InPlaceTest: Check that we reuse when Inplace allows us to.
TEST_F(PlannerTest, InPlaceTest) {
// tensor variables:
std::string X1("X1"), X2("X2"), X3("X3"), X4("X4");
// graph structure:
AddNormalNode(X1, X2); // no in-place operator; X1: input; X2: temporary
AddInplaceNode(X2, X3); // may-in-place operator; X3: temporary
AddNormalNode(X3, X4); // no in-place operator; X4: output
// simulate shape-inference results:
Shape shape1{"M", "N"};
auto shape = &shape1.value;
SetShape({{X1, shape}, {X2, shape}, {X3, shape}, {X4, shape}});
CreatePlan();
// check allocation kind:
CheckAllocKind(X1, AllocKind::kPreExisting);
CheckAllocKind(X2, AllocKind::kAllocate);
CheckAllocKind(X3, AllocKind::kReuse);
CheckAllocKind(X4, AllocKind::kAllocateOutput);
// check each ml-value is freed at appropriate step
CheckFreed(0, {});
CheckFreed(1, {});
CheckFreed(2, {X2});
}
// InPlaceSizeMismatchTest: Check that Inplace reuse is not allowed when sizes don't match.
// Also tests reuse of disjoint lifetime tensors.
TEST_F(PlannerTest, InPlaceSizeMismatchTest) {
// tensor variables:
std::string X1("X1"), X2("X2"), X3("X3"), X4("X4"), X5("X5");
// graph structure:
AddNormalNode(X1, X2); // no in-place operator; X1: input; X2: temporary
AddInplaceNode(X2, X3); // may-in-place operator; X3: temporary
AddNormalNode(X3, X4); // no in-place operator; X4: temporary
AddInplaceNode(X4, X5); // may-in-place operator; X5 output
// simulate shape-inference results:
Shape shape1w{"M", "N"};
auto shape1 = &shape1w.value;
Shape shape2w{"M", "K"};
auto shape2 = &shape2w.value;
SetShape({{X1, shape1}, {X2, shape1}, {X3, shape2}, {X4, shape1}, {X5, shape1}});
CreatePlan();
// check allocation kind:
CheckAllocKind(X1, AllocKind::kPreExisting);
CheckAllocKind(X2, AllocKind::kAllocate);
CheckAllocKind(X3, AllocKind::kAllocate);
CheckAllocKind(X4, AllocKind::kReuse);
CheckAllocKind(X5, AllocKind::kAllocateOutput);
// check each ml-value is freed at appropriate step
CheckFreed(0, {});
CheckFreed(1, {});
CheckFreed(2, {X3});
CheckFreed(3, {X2});
}
// Test operator<< to output details of an allocation & execution plan.
TEST_F(PlannerTest, PlanOutputTest) {
// tensor variables:
std::string X1("X1"), X2("X2"), X3("X3"), X4("X4");
// graph structure:
AddNormalNode(X1, X2); // no in-place operator; X1: input; X2: temporary
AddInplaceNode(X2, X3); // may-in-place operator; X3: temporary
AddNormalNode(X3, X4); // no in-place operator; X4: output
// simulate shape-inference results:
Shape shape1{"M", "N"};
auto shape = &shape1.value;
SetShape({{X1, shape}, {X2, shape}, {X3, shape}, {X4, shape}});
CreatePlan();
try {
std::ostringstream output;
output << std::make_pair(&GetPlan(), &GetState());
auto output_size = output.str().size();
// Currently, we don't check details of the output, as it may change over time.
EXPECT_GT(output_size, 0);
} catch (const std::exception& ex) {
EXPECT_TRUE(false) << "Exception in producing output: " << ex.what();
}
}
} // namespace test
} // namespace onnxruntime