onnxruntime/onnxruntime/test/framework/allocation_planner_test.cc
Ke Zhang 3bf0e364e2
Move CopyTensor out of IExecutionProvider interface. (#1268)
* add ortdevice class

* add data transfer manager for copying tensors.

* update

* add data trasnfer for gpu

* fix constexpr build break.

* update

* remove unnecessary header files.

* remove unnecessary header files.

* add dependency

* add dependency

* add dependency

* add dependency

* fix linux build break.

* update

* fix build break

* fix build break

* fix build break

* update

* update

* update c api.

* update to not use OrtCreateAllocatorInfo

* change to all eps .

* fix linux build break

* remove useless codes.

* update

* move datatransfermanager in session state

* update

* fix cuda build break.

* fix comments

* fix windows GPU build.

* fix comments

* fix build break

* fix comments

* fix test failure

* update

* fix comments

* fix onnx runtime server.

* update

* fix test failure.

* fix comments

* fix comment
2019-07-11 14:49:20 -07:00

442 lines
16 KiB
C++

// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT License.
#include <string>
#include <unordered_map>
#include <unordered_set>
#include <sstream>
#include "core/framework/session_state.h"
#include "core/graph/model.h"
#include "gtest/gtest.h"
#include "core/framework/op_kernel.h"
#include "test/framework/model_builder_utils.h"
#include "core/framework/allocation_planner.h"
#include "core/providers/cpu/cpu_execution_provider.h"
using namespace ONNX_NAMESPACE;
namespace onnxruntime {
namespace test {
namespace modelbuilder {
class NodeCounter {
private:
static int node_count_;
public:
static int Next() { return ++node_count_; }
};
int NodeCounter::node_count_ = 0;
struct UnaryNode {
std::vector<onnxruntime::NodeArg*> input_args;
std::vector<onnxruntime::NodeArg*> output_args;
onnxruntime::Node* p_node;
UnaryNode(onnxruntime::Graph& graph, const std::string& op,
onnxruntime::NodeArg* p_input_arg, onnxruntime::NodeArg* p_output_arg)
: input_args({p_input_arg}), output_args({p_output_arg}) {
int num = NodeCounter::Next();
p_node = &graph.AddNode("node" + std::to_string(num), op, "test op", input_args, output_args);
}
UnaryNode(onnxruntime::Graph& graph, onnxruntime::NodeArg* p_input_arg, onnxruntime::NodeArg* p_output_arg)
: UnaryNode(graph, "Transpose", p_input_arg, p_output_arg) {}
};
class DummyOpKernel : public OpKernel {
public:
DummyOpKernel(const OpKernelInfo& p) : OpKernel(p) {}
Status Compute(OpKernelContext* context) const {
ORT_UNUSED_PARAMETER(context);
return Status::OK();
}
Status ComputeAsync(OpKernelContext* context, DoneCallback done) const {
ORT_UNUSED_PARAMETER(context);
ORT_UNUSED_PARAMETER(done);
return Status::OK();
}
};
} // namespace modelbuilder
using namespace modelbuilder;
class AllocationPlanTestUtility {
public:
static void CheckAllocationKind(const SequentialExecutionPlan& plan, std::vector<AllocKind>& expected) {
ASSERT_EQ(plan.allocation_plan.size(), expected.size()) << "Allocation plan of wrong size";
for (size_t i = 0; i < expected.size(); ++i) {
EXPECT_EQ(plan.allocation_plan[i].alloc_kind, expected[i]) << "Error in allocation kind at position " << i;
}
}
static void CheckToBeFreed(const SequentialExecutionPlan& plan, const std::vector<OrtValueIndex>& expected) {
ASSERT_EQ(plan.to_be_freed.size(), expected.size()) << "Allocation plan's to_be_freed of wrong size";
for (size_t i = 0; i < expected.size(); ++i) {
EXPECT_EQ(plan.to_be_freed[i], expected[i]) << "Error in to_be_freed at position " << i;
}
}
static void CheckFreedAtEachStep(const SequentialExecutionPlan& plan, const std::vector<int>& expected_num_freed) {
ASSERT_EQ(plan.execution_plan.size(), expected_num_freed.size()) << "Execution plan is of wrong size";
int start = 0;
for (size_t i = 0; i < expected_num_freed.size(); ++i) {
if (expected_num_freed[i] > 0) {
EXPECT_EQ(plan.execution_plan[i].free_from_index, start) << "Error in free_from_index at position " << i;
EXPECT_EQ(plan.execution_plan[i].free_to_index, start + expected_num_freed[i] - 1)
<< "Error in free_to_index at position " << i;
start = start + expected_num_freed[i];
} else {
// "free_from_index > free_to_index" indicates nothing is to be freed
EXPECT_GT(plan.execution_plan[i].free_from_index, plan.execution_plan[i].free_to_index);
}
}
}
static void BasicIntegrityCheck(const SequentialExecutionPlan& plan, size_t num_ml_values) {
// Sanity checks for plan.to_be_freed
std::unordered_set<OrtValueIndex> freed;
for (OrtValueIndex index : plan.to_be_freed) {
// Every index should be in the valid range [0, num_ml_values-1]
EXPECT_GE(index, 0);
EXPECT_LT(index, num_ml_values);
// An index should not be freed more than once
EXPECT_EQ(freed.count(index), 0) << "OrtValue " << index << " freed multiple times";
freed.insert(index);
}
// Check the free-index information for every execution step: they should cover the
// range [0, plan.to_be_freed.size()-1] properly.
int next_free_index = 0;
int max_free_index = ((int)plan.to_be_freed.size()) - 1;
for (const SequentialExecutionPlan::NodeExecutionPlan& step : plan.execution_plan) {
if (step.free_from_index <= step.free_to_index) {
EXPECT_EQ(step.free_from_index, next_free_index);
EXPECT_LE(step.free_to_index, max_free_index);
next_free_index = step.free_to_index + 1;
} // else nothing needs to be freed in this step
}
}
};
typedef std::unordered_map<const onnxruntime::NodeArg*, TensorShapeProto*> ShapeMap;
class SequentialPlannerTestContext : public ISequentialPlannerContext {
public:
SequentialPlannerTestContext(ShapeMap* shape_map) : shape_map_(shape_map) {}
TensorShapeProto* GetShape(const onnxruntime::NodeArg& arg) const override {
auto iter = shape_map_->find(&arg);
return (shape_map_->end() != iter) ? iter->second : nullptr;
}
private:
ShapeMap* shape_map_;
};
class PlannerTest : public ::testing::Test {
private:
void index(const std::string& name, int& out) {
ASSERT_TRUE(state_.GetOrtValueNameIdxMap().GetIdx(name, out).IsOK());
}
onnxruntime::Model model_;
onnxruntime::Graph& graph_;
// some standard components used to build test-cases:
Type float_type_;
std::unique_ptr<::onnxruntime::KernelDef> std_kernel_; // a unary kernel with no-aliasing and no-in-place
std::unique_ptr<::onnxruntime::KernelDef> in_place_kernel_; // a unary kernel with in-place
std::unordered_map<std::string, onnxruntime::NodeArg*> name_to_arg_;
std::vector<std::unique_ptr<UnaryNode>> nodes_;
std::vector<std::unique_ptr<OpKernelInfo>> op_kernel_infos_;
std::vector<std::pair<onnxruntime::Node*, KernelDef&>> kernel_bindings_;
ExecutionProviders execution_providers_;
SessionState state_;
ShapeMap shape_map_;
std::unique_ptr<SequentialExecutionPlan> plan_;
public:
PlannerTest() : model_("test"), graph_{model_.MainGraph()}, state_{execution_providers_, false} {
std_kernel_ = KernelDefBuilder().SetName("Transpose").Build();
in_place_kernel_ = KernelDefBuilder().SetName("Clip").MayInplace(0, 0).Build();
CPUExecutionProviderInfo epi;
auto execution_provider = std::make_unique<CPUExecutionProvider>(epi);
execution_providers_.Add("CPUExecutionProvider", std::move(execution_provider));
}
~PlannerTest() = default;
onnxruntime::NodeArg* Arg(const std::string& name) {
auto iter = name_to_arg_.find(name);
if (name_to_arg_.end() != iter) return iter->second;
return (name_to_arg_[name] = &graph_.GetOrCreateNodeArg(name, &float_type_.value));
}
onnxruntime::Node* AddNode(::onnxruntime::KernelDef& kernel_def, std::string& input, std::string& output) {
auto node = std::make_unique<UnaryNode>(graph_, kernel_def.OpName(), Arg(input), Arg(output));
auto* p_node = node->p_node;
p_node->SetExecutionProviderType(onnxruntime::kCpuExecutionProvider);
nodes_.push_back(std::move(node));
kernel_bindings_.emplace_back(p_node, kernel_def);
return p_node;
}
onnxruntime::Node* AddNormalNode(std::string& input, std::string& output) {
return AddNode(*std_kernel_, input, output);
}
onnxruntime::Node* AddInplaceNode(std::string& input, std::string& output) {
return AddNode(*in_place_kernel_, input, output);
}
void BindKernel(onnxruntime::Node* p_node, ::onnxruntime::KernelDef& kernel_def) {
auto info = std::make_unique<OpKernelInfo>(*p_node, kernel_def, *execution_providers_.Get(*p_node),
state_.GetInitializedTensors(), state_.GetOrtValueNameIdxMap(),
state_.GetFuncMgr(), state_.GetDataTransferMgr());
auto dummy = std::make_unique<DummyOpKernel>(*info);
op_kernel_infos_.push_back(std::move(info));
state_.AddKernel(p_node->Index(), std::move(dummy));
}
void SetShape(std::string& name, TensorShapeProto* shape) {
shape_map_[Arg(name)] = shape;
}
void SetShape(std::initializer_list<std::pair<std::string&, TensorShapeProto*>> shapes) {
for (auto& pair : shapes) {
SetShape(pair.first, pair.second);
}
}
void CreatePlan(const std::vector<const NodeArg*>& outer_scope_node_args = {}) {
EXPECT_EQ(graph_.Resolve(), Status::OK());
state_.SetGraphViewer(std::make_unique<GraphViewer>(graph_));
OrtValueNameIdxMap& mlvalue_name_idx_map{state_.GetOrtValueNameIdxMap()};
int count = 0;
for (auto& pair : name_to_arg_) {
EXPECT_EQ(mlvalue_name_idx_map.Add(pair.first), count++);
}
for (auto& binding : kernel_bindings_) {
BindKernel(binding.first, binding.second);
}
auto cpu_execution_provider = std::make_unique<CPUExecutionProvider>(CPUExecutionProviderInfo());
KernelRegistryManager kernel_registry_manager;
ExecutionProviders execution_providers;
execution_providers.Add(onnxruntime::kCpuExecutionProvider, std::move(cpu_execution_provider));
auto status = kernel_registry_manager.RegisterKernels(execution_providers);
EXPECT_TRUE(status.IsOK()) << status.ErrorMessage();
SequentialPlannerTestContext test_context(&shape_map_);
status = SequentialPlanner::CreatePlan(nullptr, GraphViewer(graph_), outer_scope_node_args, execution_providers,
kernel_registry_manager, mlvalue_name_idx_map, test_context, plan_);
EXPECT_TRUE(status.IsOK()) << status.ErrorMessage();
AllocationPlanTestUtility::BasicIntegrityCheck(*plan_, name_to_arg_.size());
}
void CheckAllocKind(const std::string& name, AllocKind kind) {
int id;
index(name, id);
EXPECT_EQ(plan_->allocation_plan[id].alloc_kind, kind) << "Error in allocation kind for " << name;
}
void CheckFreed(int step_number, std::initializer_list<std::string> freed_items) {
// create set and check equality
std::unordered_set<int> expected;
for (auto& name : freed_items) {
int id;
index(name, id);
expected.insert(id);
}
std::unordered_set<int> plan_result;
auto& step_plan = plan_->execution_plan[step_number];
for (int i = step_plan.free_from_index; i <= step_plan.free_to_index; ++i)
plan_result.insert(plan_->to_be_freed[i]);
EXPECT_EQ(plan_result, expected) << "Freed items incorrect for step " << step_number;
}
protected:
Graph& GetGraph() { return graph_; }
const SequentialExecutionPlan& GetPlan() const { return *plan_; }
const SessionState& GetState() const { return state_; }
};
TEST_F(PlannerTest, ChainTest) {
// tensor variables:
std::string W("W"), X("X"), B("B"), Y("Y"), Z("Z");
// graph structure:
ONNX_NAMESPACE::TensorProto tensor;
tensor.add_dims(1);
tensor.add_float_data(1.0f);
tensor.set_data_type(TensorProto_DataType_FLOAT);
tensor.set_name("W");
GetGraph().AddInitializedTensor(tensor);
AddNormalNode(W, X);
AddNormalNode(X, B);
AddNormalNode(B, Y);
AddNormalNode(Y, Z);
// simulate shape-inference results:
Shape shape1{50, 100};
auto shape = &shape1.value;
SetShape({{X, shape}, {B, shape}, {Y, shape}, {Z, shape}});
CreatePlan();
// Expected plan:
// W: kAllocateStatically; X: kAllocate; B: kAllocate; Y: kReuse (X); post-node3: free(B); X is returned output
CheckAllocKind(W, AllocKind::kAllocateStatically);
CheckAllocKind(X, AllocKind::kAllocate);
CheckAllocKind(B, AllocKind::kAllocate);
CheckAllocKind(Y, AllocKind::kReuse);
CheckAllocKind(Z, AllocKind::kAllocateOutput);
CheckFreed(0, {});
CheckFreed(1, {});
CheckFreed(2, {"B"});
CheckFreed(3, {"X"});
}
/* InputOutputTest: Test that:
(a) All inputs are classified as kPreExisting,
(b) All outer scope node args are classified as kPreExisting,
(c) All outputs are classified as kAllocate (in this example),
(d) Neither input nor outputs are freed.
*/
TEST_F(PlannerTest, InputOutputTest) {
// tensor variables:
std::string X1("X1"), X2("X2"), Y1("Y1"), Y2("Y2"), Outer1("Outer1"), Y3("Y3");
// graph structure:
AddNormalNode(X1, Y1);
AddNormalNode(X2, Y2);
// add node that consumes an outer scope node arg
auto outer_node = AddNormalNode(Outer1, Y3);
const NodeArg* outer_scope_node_arg = outer_node->InputDefs().at(0);
GetGraph().AddOuterScopeNodeArg(Outer1);
// simulate no shape-inference:
CreatePlan({outer_scope_node_arg});
// X1: kPreExisting, X2: kPreExisting, Outer1: kPreExisting, Y1: kAllocate, Y2: kAllocate, Y3: kAllocate
CheckAllocKind(X1, AllocKind::kPreExisting);
CheckAllocKind(X2, AllocKind::kPreExisting);
CheckAllocKind(Outer1, AllocKind::kPreExisting);
CheckAllocKind(Y1, AllocKind::kAllocateOutput);
CheckAllocKind(Y2, AllocKind::kAllocateOutput);
CheckAllocKind(Y3, AllocKind::kAllocateOutput);
// Nothing should be freed (since they are either inputs or outputs)
CheckFreed(0, {});
CheckFreed(1, {});
CheckFreed(2, {});
}
// InPlaceTest: Check that we reuse when Inplace allows us to.
TEST_F(PlannerTest, InPlaceTest) {
// tensor variables:
std::string X1("X1"), X2("X2"), X3("X3"), X4("X4");
// graph structure:
AddNormalNode(X1, X2); // no in-place operator; X1: input; X2: temporary
AddInplaceNode(X2, X3); // may-in-place operator; X3: temporary
AddNormalNode(X3, X4); // no in-place operator; X4: output
// simulate shape-inference results:
Shape shape1{"M", "N"};
auto shape = &shape1.value;
SetShape({{X1, shape}, {X2, shape}, {X3, shape}, {X4, shape}});
CreatePlan();
// check allocation kind:
CheckAllocKind(X1, AllocKind::kPreExisting);
CheckAllocKind(X2, AllocKind::kAllocate);
CheckAllocKind(X3, AllocKind::kReuse);
CheckAllocKind(X4, AllocKind::kAllocateOutput);
// check each ml-value is freed at appropriate step
CheckFreed(0, {});
CheckFreed(1, {});
CheckFreed(2, {X2});
}
// InPlaceSizeMismatchTest: Check that Inplace reuse is not allowed when sizes don't match.
// Also tests reuse of disjoint lifetime tensors.
TEST_F(PlannerTest, InPlaceSizeMismatchTest) {
// tensor variables:
std::string X1("X1"), X2("X2"), X3("X3"), X4("X4"), X5("X5");
// graph structure:
AddNormalNode(X1, X2); // no in-place operator; X1: input; X2: temporary
AddInplaceNode(X2, X3); // may-in-place operator; X3: temporary
AddNormalNode(X3, X4); // no in-place operator; X4: temporary
AddInplaceNode(X4, X5); // may-in-place operator; X5 output
// simulate shape-inference results:
Shape shape1w{"M", "N"};
auto shape1 = &shape1w.value;
Shape shape2w{"M", "K"};
auto shape2 = &shape2w.value;
SetShape({{X1, shape1}, {X2, shape1}, {X3, shape2}, {X4, shape1}, {X5, shape1}});
CreatePlan();
// check allocation kind:
CheckAllocKind(X1, AllocKind::kPreExisting);
CheckAllocKind(X2, AllocKind::kAllocate);
CheckAllocKind(X3, AllocKind::kAllocate);
CheckAllocKind(X4, AllocKind::kReuse);
CheckAllocKind(X5, AllocKind::kAllocateOutput);
// check each ml-value is freed at appropriate step
CheckFreed(0, {});
CheckFreed(1, {});
CheckFreed(2, {X3});
CheckFreed(3, {X2});
}
// Test operator<< to output details of an allocation & execution plan.
TEST_F(PlannerTest, PlanOutputTest) {
// tensor variables:
std::string X1("X1"), X2("X2"), X3("X3"), X4("X4");
// graph structure:
AddNormalNode(X1, X2); // no in-place operator; X1: input; X2: temporary
AddInplaceNode(X2, X3); // may-in-place operator; X3: temporary
AddNormalNode(X3, X4); // no in-place operator; X4: output
// simulate shape-inference results:
Shape shape1{"M", "N"};
auto shape = &shape1.value;
SetShape({{X1, shape}, {X2, shape}, {X3, shape}, {X4, shape}});
CreatePlan();
try {
std::ostringstream output;
output << std::make_pair(&GetPlan(), &GetState());
auto output_size = output.str().size();
// Currently, we don't check details of the output, as it may change over time.
EXPECT_GT(output_size, 0);
} catch (const std::exception& ex) {
EXPECT_TRUE(false) << "Exception in producing output: " << ex.what();
}
}
} // namespace test
} // namespace onnxruntime