// onnxruntime/winml/lib/Api.Ort/OnnxruntimeCpuSessionBuilder.cpp
// 2020-04-17 14:10:50 -07:00
//
// 91 lines
// 2.9 KiB
// C++

// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT License.
#include "pch.h"
#include <thread>
#include "OnnxruntimeCpuSessionBuilder.h"
#include "OnnxruntimeEngine.h"
#include "OnnxruntimeErrors.h"
using namespace _winml;
// Stores the engine factory this builder uses to reach the ORT API table, the
// WinML adapter API table and the ORT environment.
//
// Parameters:
//   engine_factory - factory backing this builder; must not be null.
//
// Returns E_INVALIDARG when engine_factory is null, S_OK otherwise.
HRESULT OnnxruntimeCpuSessionBuilder::RuntimeClassInitialize(OnnxruntimeEngineFactory* engine_factory) {
  // CreateSessionOptions, CreateSession and Initialize all dereference
  // engine_factory_ without checking it, so reject a null factory up front
  // rather than failing on first use.
  RETURN_HR_IF_NULL(E_INVALIDARG, engine_factory);
  engine_factory_ = engine_factory;
  return S_OK;
}
// Builds an OrtSessionOptions configured for CPU execution and hands ownership
// of it to the caller through `options`.
//
// Configuration applied, in order:
//   1. graph optimization level ORT_ENABLE_ALL,
//   2. intra-op thread count = std::thread::hardware_concurrency(),
//   3. the CPU execution provider (arena flag set only when _WIN64 is defined).
//
// Returns E_POINTER when `options` is null, a failure HRESULT via
// RETURN_HR_IF_NOT_OK_MSG when an ORT call reports an error, S_OK otherwise.
// `*options` is written only on success.
HRESULT
OnnxruntimeCpuSessionBuilder::CreateSessionOptions(
    OrtSessionOptions** options) {
  RETURN_HR_IF_NULL(E_POINTER, options);

  auto api = engine_factory_->UseOrtApi();
  auto adapter_api = engine_factory_->UseWinmlAdapterApi();

  OrtSessionOptions* raw_options;
  RETURN_HR_IF_NOT_OK_MSG(api->CreateSessionOptions(&raw_options), api);

  // Guard the new object with its release function so the early returns below
  // do not leak it.
  auto guarded_options = UniqueOrtSessionOptions(raw_options, api->ReleaseSessionOptions);

  // Enable every graph optimization (this setting used to be called level 3).
  RETURN_HR_IF_NOT_OK_MSG(
      api->SetSessionGraphOptimizationLevel(guarded_options.get(), GraphOptimizationLevel::ORT_ENABLE_ALL),
      api);

  // By default Onnxruntime uses only half of the concurrent threads supported
  // on the system, which keeps MLAS from exercising every logical core. Size
  // the thread pool to the full hardware concurrency so that WinML always runs
  // as fast as it can.
  // NOTE(review): hardware_concurrency() may return 0 when the value is not
  // computable; confirm how SetIntraOpNumThreads treats 0.
  const auto logical_core_count = std::thread::hardware_concurrency();
  RETURN_HR_IF_NOT_OK_MSG(api->SetIntraOpNumThreads(guarded_options.get(), logical_core_count), api);

  // The arena flag is turned on for 64-bit builds only.
#ifdef _WIN64
  const bool use_arena = true;
#else
  const bool use_arena = false;
#endif
  RETURN_HR_IF_NOT_OK_MSG(
      adapter_api->OrtSessionOptionsAppendExecutionProvider_CPU(guarded_options.get(), use_arena),
      api);

  // Transfer ownership to the caller: release() keeps the guard from freeing
  // the underlying OrtSessionOptions object.
  *options = guarded_options.release();
  return S_OK;
}
// Creates an ORT session that has no model attached, using the ORT environment
// owned by the engine factory.
//
// Parameters:
//   options - session options forwarded unchanged to the WinML adapter's
//             CreateSessionWithoutModel; not validated here.
//   session - receives the new session on success. The caller takes ownership
//             (the matching release function is the ORT API's ReleaseSession).
//
// Returns E_POINTER when `session` is null, the failing HRESULT from
// GetOrtEnvironment, a failure HRESULT via RETURN_HR_IF_NOT_OK_MSG when session
// creation reports an error, S_OK otherwise. `*session` is written only on
// success.
HRESULT
OnnxruntimeCpuSessionBuilder::CreateSession(
    OrtSessionOptions* options,
    OrtSession** session) {
  RETURN_HR_IF_NULL(E_POINTER, session);

  auto ort_api = engine_factory_->UseOrtApi();
  auto winml_adapter_api = engine_factory_->UseWinmlAdapterApi();

  OrtEnv* ort_env = nullptr;
  RETURN_IF_FAILED(engine_factory_->GetOrtEnvironment(&ort_env));

  // Create into a local first so the caller's pointer is untouched on failure.
  OrtSession* ort_session = nullptr;
  RETURN_HR_IF_NOT_OK_MSG(winml_adapter_api->CreateSessionWithoutModel(ort_env, options, &ort_session),
                          ort_api);

  // Nothing can fail past this point, so the session goes straight to the
  // caller without an intermediate owning wrapper.
  *session = ort_session;
  return S_OK;
}
// Runs the WinML adapter's SessionInitialize on `session`.
//
// Returns E_INVALIDARG when `session` is null, a failure HRESULT via
// RETURN_HR_IF_NOT_OK_MSG when initialization reports an error, S_OK otherwise.
HRESULT
OnnxruntimeCpuSessionBuilder::Initialize(
    OrtSession* session) {
  RETURN_HR_IF_NULL(E_INVALIDARG, session);

  RETURN_HR_IF_NOT_OK_MSG(
      engine_factory_->UseWinmlAdapterApi()->SessionInitialize(session),
      engine_factory_->UseOrtApi());

  return S_OK;
}