mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-05-25 22:26:24 +00:00
this is a big PR. we are going to move it up to layer_dev , which is still a L3 so we are still safe to do work there agile. we are going to move this into the L3 so that ryan can start doing intergration testing. we will pause for a full code review and integration test result prior to going into the L2. >>>> raw comments from previous commits >>> * LearningModelSession is cleaned up to use the adapter, and parts of binding are. * moved everything in the winmladapter made it all nano-com using, WRL to construct objects in the ORT side. base interfaces for everythign for winml to call cleaned up a bunch of winml to use the base interfaces. * more pieces * GetData across the abi. * renamed some namepsace cleaned up OrtValue cleaned up Tensor cleaned up custom ops. everything *but* learnignmodel should be clean * make sure it's building. winml.dll is still a monolith.
459 lines
No EOL
17 KiB
C++
459 lines
No EOL
17 KiB
C++
// Copyright (c) Microsoft Corporation.
|
|
// Licensed under the MIT License.
|
|
|
|
#include "pch.h"
|
|
#include "ConverterResourceStore.h"
|
|
#include "impl/FeatureCompatibility.h"
|
|
#include "FeatureValues.h"
|
|
#include "LearningModelBinding.h"
|
|
#include "LearningModelSession.h"
|
|
#include "TelemetryEvent.h"
|
|
|
|
using namespace WinML;
|
|
|
|
namespace winrt::Windows::AI::MachineLearning::implementation {
|
|
LearningModelBinding::LearningModelBinding(
|
|
Windows::AI::MachineLearning::LearningModelSession const& session) try : m_session(session) {
|
|
m_lotusBinding.attach(session.as<LearningModelSession>()->CreateSessionBinding());
|
|
WINML_THROW_IF_FAILED(OrtGetWinMLAdapter(adapter_.put()));
|
|
}
|
|
WINML_CATCH_ALL
|
|
|
|
static Windows::AI::MachineLearning::ILearningModelFeatureDescriptor FindValidBinding(
|
|
winrt::Windows::Foundation::Collections::IIterable<ILearningModelFeatureDescriptor> descriptors,
|
|
const std::wstring& name) {
|
|
for (auto descriptor : descriptors) {
|
|
auto descriptor_native = descriptor.as<ILearningModelFeatureDescriptorNative>();
|
|
|
|
const wchar_t* feature_name;
|
|
uint32_t size;
|
|
WINML_THROW_IF_FAILED(descriptor_native->GetName(&feature_name, &size));
|
|
|
|
// Case insensetive comparison of onnx name in feature descriptor, and passed in name
|
|
if (_wcsicmp(feature_name, name.c_str()) == 0) {
|
|
return descriptor;
|
|
}
|
|
}
|
|
return nullptr;
|
|
}
|
|
|
|
using NullableBindingPort = std::optional<std::pair<Windows::AI::MachineLearning::ILearningModelFeatureDescriptor, BindingType>>;
|
|
|
|
static NullableBindingPort FindValidBinding(
|
|
LearningModel model,
|
|
const std::wstring& name) {
|
|
if (auto descriptor = FindValidBinding(model.InputFeatures(), name)) {
|
|
return std::make_pair(descriptor, BindingType::kInput);
|
|
} else if (auto output_descriptor = FindValidBinding(model.OutputFeatures(), name)) {
|
|
return std::make_pair(output_descriptor, BindingType::kOutput);
|
|
}
|
|
|
|
return {};
|
|
}
|
|
|
|
void LearningModelBinding::CacheProvider(
|
|
std::string name,
|
|
ProviderInfo& providerInfo) {
|
|
m_providers[name] = providerInfo;
|
|
}
|
|
|
|
std::tuple<std::string, _winmla::IOrtValue*, BindingType> LearningModelBinding::CreateBinding(
|
|
const std::string& name,
|
|
const Windows::Foundation::IInspectable& inspectable,
|
|
Windows::Foundation::Collections::IPropertySet const& properties) {
|
|
// Given a known type, validate against the model
|
|
auto model = m_session.Model();
|
|
auto bindingPort = FindValidBinding(model, WinML::Strings::WStringFromString(name));
|
|
|
|
WINML_THROW_HR_IF_FALSE_MSG(
|
|
WINML_ERR_INVALID_BINDING,
|
|
bindingPort.has_value(),
|
|
"The model has no variable with name %s.",
|
|
name.c_str());
|
|
|
|
// Retrieve the descriptor and binding type
|
|
auto descriptor = bindingPort->first;
|
|
auto bindingType = bindingPort->second;
|
|
|
|
// Create a feature value from the iinspectable input
|
|
auto featureValue = WinML::CreateFeatureValueFromInspectable(bindingType, inspectable, descriptor);
|
|
WINML_THROW_HR_IF_NULL_MSG(
|
|
WINML_ERR_INVALID_BINDING,
|
|
featureValue,
|
|
"The model variable %s cannot be bound with the provided type.",
|
|
name.c_str());
|
|
|
|
// Validate that the feature value is compatible with the descriptor
|
|
WinML::VerifyFeatureValueCompatibleWithDescriptor(featureValue, descriptor);
|
|
|
|
// Create the Binding Context to pass to the feature value
|
|
BindingContext context{
|
|
bindingType,
|
|
m_session,
|
|
descriptor,
|
|
properties,
|
|
{} // SubresourceId is set by callee
|
|
};
|
|
|
|
// Get the bound tensor
|
|
winrt::com_ptr<_winmla::IOrtValue> value;
|
|
|
|
// Get the native ORT interface for the given bind value
|
|
auto spLotusValueProvider = featureValue.as<WinML::ILotusValueProviderPrivate>();
|
|
|
|
auto spSession = m_session.as<LearningModelSession>();
|
|
|
|
// Check if the feature value is a placeholder
|
|
bool isPlaceHolder;
|
|
WINML_THROW_IF_FAILED(spLotusValueProvider->IsPlaceholder(&isPlaceHolder));
|
|
|
|
// If binding a tensor for gpu execution, always bind.
|
|
// If it is a placeholder, gpu resources will be preallocated during bind.
|
|
// This enables the chaining scenario.
|
|
auto spDevice = m_session.Device().as<LearningModelDevice>();
|
|
auto isGpuSession = !spDevice->IsCpuDevice();
|
|
auto spTensor = featureValue.try_as<ITensor>();
|
|
auto isTensorWithShape = spTensor != nullptr && spTensor.Shape().Size() != 0;
|
|
auto shouldAlwaysTensorize = isTensorWithShape && isGpuSession;
|
|
|
|
if (!isPlaceHolder || shouldAlwaysTensorize) {
|
|
// If not a placeholder, attempt to get the underlying resource
|
|
WINML_THROW_IF_FAILED_MSG(
|
|
spLotusValueProvider->GetOrtValue(context, value.put()),
|
|
"The model variable %s failed tensorization.",
|
|
name.c_str());
|
|
} else {
|
|
WINML_THROW_HR_IF_TRUE_MSG(
|
|
WINML_ERR_INVALID_BINDING,
|
|
isPlaceHolder && bindingType == BindingType::kInput,
|
|
"The model variable %s is an input, but has no associated resources to bind.",
|
|
name.c_str());
|
|
}
|
|
|
|
// Hold onto the input output providers so that our memory doesnt get destroyed!
|
|
auto providerInfo = ProviderInfo{inspectable, spLotusValueProvider, context};
|
|
CacheProvider(name, providerInfo);
|
|
|
|
return std::make_tuple(name, value.detach(), bindingType);
|
|
}
|
|
|
|
void LearningModelBinding::Bind(
|
|
hstring const& name,
|
|
Windows::Foundation::IInspectable const& value) try {
|
|
return Bind(name, value, nullptr /* no properties */);
|
|
}
|
|
WINML_CATCH_ALL
|
|
|
|
void LearningModelBinding::Bind(
|
|
hstring const& name,
|
|
Windows::Foundation::IInspectable const& value,
|
|
Windows::Foundation::Collections::IPropertySet const& properties) try {
|
|
_winmlt::TelemetryEvent binding_event(_winmlt::EventCategory::kBinding);
|
|
|
|
BindingType bindingType;
|
|
std::string bindingName;
|
|
_winmla::IOrtValue* bindingValuePtr;
|
|
winrt::com_ptr<_winmla::IOrtValue> bindingValue;
|
|
|
|
auto featureName = WinML::Strings::UTF8FromHString(name);
|
|
std::tie(bindingName, bindingValuePtr, bindingType) = CreateBinding(featureName, value, properties);
|
|
bindingValue.attach(bindingValuePtr);
|
|
|
|
switch (bindingType) {
|
|
case BindingType::kInput:
|
|
WINML_THROW_IF_FAILED(m_lotusBinding->BindInput(bindingName, bindingValue.get()));
|
|
break;
|
|
case BindingType::kOutput:
|
|
WINML_THROW_IF_FAILED(m_lotusBinding->BindOutput(bindingName, bindingValue.get()));
|
|
break;
|
|
default:
|
|
FAIL_FAST();
|
|
}
|
|
}
|
|
WINML_CATCH_ALL
|
|
|
|
void LearningModelBinding::Clear() try {
|
|
m_lotusBinding.attach(m_session.as<LearningModelSession>()->CreateSessionBinding());
|
|
m_providers.clear();
|
|
}
|
|
WINML_CATCH_ALL
|
|
|
|
Windows::Foundation::Collections::IIterator<LearningModelBinding::KeyValuePair> LearningModelBinding::First() {
|
|
std::unordered_map<hstring, Windows::Foundation::IInspectable> bindingsMap;
|
|
|
|
for (auto mergedBindings : m_providers) {
|
|
auto name = WinML::Strings::HStringFromUTF8(mergedBindings.first);
|
|
bindingsMap[name] = mergedBindings.second.CallerSpecifiedFeatureValue;
|
|
}
|
|
|
|
return winrt::single_threaded_map(std::move(bindingsMap)).First();
|
|
}
|
|
|
|
Windows::Foundation::IInspectable LearningModelBinding::Lookup(hstring const& key) {
|
|
auto utf8Name = WinML::Strings::UTF8FromHString(key);
|
|
|
|
auto foundIt = m_providers.find(utf8Name);
|
|
WINML_THROW_HR_IF_FALSE_MSG(
|
|
E_BOUNDS,
|
|
foundIt != std::end(m_providers),
|
|
"The binding collection does not contain a variable with name %s.",
|
|
utf8Name.c_str());
|
|
|
|
auto providerInfo = foundIt->second;
|
|
return providerInfo.CallerSpecifiedFeatureValue;
|
|
}
|
|
|
|
uint32_t LearningModelBinding::Size() {
|
|
return static_cast<uint32_t>(m_providers.size());
|
|
}
|
|
|
|
bool LearningModelBinding::HasKey(hstring const& key) {
|
|
auto utf8Name = WinML::Strings::UTF8FromHString(key);
|
|
return m_providers.find(utf8Name) != m_providers.end();
|
|
}
|
|
|
|
void LearningModelBinding::Split(
|
|
Windows::Foundation::Collections::IMapView<hstring, Windows::Foundation::IInspectable>& first,
|
|
Windows::Foundation::Collections::IMapView<hstring, Windows::Foundation::IInspectable>& second) {
|
|
throw hresult_not_implemented();
|
|
}
|
|
|
|
_winmla::IIOBinding* LearningModelBinding::BindingCollection() {
|
|
_winmla::IIOBinding* p;
|
|
m_lotusBinding.copy_to(&p);
|
|
return p;
|
|
}
|
|
|
|
bool LearningModelBinding::IsOfMapType(_winmla::IOrtValue* mlValue, TensorKind key_kind, TensorKind value_kind) {
|
|
return mlValue->Type() == adapter_->GetMapType(key_kind, value_kind);
|
|
};
|
|
|
|
bool LearningModelBinding::IsOfVectorMapType(_winmla::IOrtValue* mlValue, TensorKind key_kind, TensorKind value_kind) {
|
|
return mlValue->Type() == adapter_->GetVectorMapType(key_kind, value_kind);
|
|
};
|
|
|
|
bool LearningModelBinding::IsOfTensorType(_winmla::ITensor* tensorValue, TensorKind kind) {
|
|
return tensorValue->DataType() == adapter_->GetTensorType(kind);
|
|
};
|
|
|
|
ILearningModelFeatureValue LearningModelBinding::CreateUnboundOuputFeatureValue(
|
|
_winmla::IOrtValue* mlValue,
|
|
ILearningModelFeatureDescriptor& descriptor) {
|
|
if (mlValue->IsTensor()) {
|
|
winrt::com_ptr<_winmla::ITensor> tensorValue;
|
|
mlValue->GetTensor(tensorValue.put());
|
|
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::Float)) {
|
|
if (descriptor.Kind() == LearningModelFeatureKind::Image) {
|
|
using namespace Windows::Graphics::Imaging;
|
|
// TODO: this format for unbound ouput needs more discussion
|
|
BitmapPixelFormat format = descriptor.as<ImageFeatureDescriptor>()->BitmapPixelFormat();
|
|
uint32_t width = static_cast<uint32_t>(tensorValue->ShapeGetDims()[3]);
|
|
uint32_t height = static_cast<uint32_t>(tensorValue->ShapeGetDims()[2]);
|
|
uint32_t batchSize = static_cast<uint32_t>(tensorValue->ShapeGetDims()[0]);
|
|
return implementation::ImageFeatureValue::Create(batchSize, format, width, height);
|
|
} else {
|
|
return implementation::TensorFloat::Create();
|
|
}
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::Double)) {
|
|
return implementation::TensorDouble::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::String)) {
|
|
return implementation::TensorString::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::UInt8)) {
|
|
return implementation::TensorUInt8Bit::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::Int8)) {
|
|
return implementation::TensorInt8Bit::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::UInt16)) {
|
|
return implementation::TensorUInt16Bit::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::Int16)) {
|
|
return implementation::TensorInt16Bit::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::UInt32)) {
|
|
return implementation::TensorUInt32Bit::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::Int32)) {
|
|
return implementation::TensorInt32Bit::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::UInt64)) {
|
|
return implementation::TensorUInt64Bit::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::Int64)) {
|
|
return implementation::TensorInt64Bit::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::Boolean)) {
|
|
return implementation::TensorBoolean::Create();
|
|
}
|
|
if (IsOfTensorType(tensorValue.get(), TensorKind::Float16)) {
|
|
return implementation::TensorFloat16Bit::Create();
|
|
}
|
|
}
|
|
// Maps
|
|
else if (IsOfMapType(mlValue, TensorKind::String, TensorKind::String)) {
|
|
return implementation::MapStringToString::Create();
|
|
} else if (IsOfMapType(mlValue, TensorKind::String, TensorKind::Int64)) {
|
|
return implementation::MapStringToInt64Bit::Create();
|
|
} else if (IsOfMapType(mlValue, TensorKind::String, TensorKind::Float)) {
|
|
return implementation::MapStringToFloat::Create();
|
|
} else if (IsOfMapType(mlValue, TensorKind::String, TensorKind::Double)) {
|
|
return implementation::MapStringToDouble::Create();
|
|
} else if (IsOfMapType(mlValue, TensorKind::Int64, TensorKind::String)) {
|
|
return implementation::MapInt64BitToString::Create();
|
|
} else if (IsOfMapType(mlValue, TensorKind::Int64, TensorKind::Int64)) {
|
|
return implementation::MapInt64BitToInt64Bit::Create();
|
|
} else if (IsOfMapType(mlValue, TensorKind::Int64, TensorKind::Float)) {
|
|
return implementation::MapInt64BitToFloat::Create();
|
|
} else if (IsOfMapType(mlValue, TensorKind::Int64, TensorKind::Double)) {
|
|
return implementation::MapInt64BitToDouble::Create();
|
|
}
|
|
// Sequences
|
|
else if (IsOfVectorMapType(mlValue, TensorKind::String, TensorKind::Float)) {
|
|
return implementation::SequenceMapStringFloat::Create();
|
|
} else if (IsOfVectorMapType(mlValue, TensorKind::Int64, TensorKind::Float)) {
|
|
return implementation::SequenceMapInt64BitFloat::Create();
|
|
}
|
|
|
|
auto utf8Name = WinML::Strings::UTF8FromHString(descriptor.Name());
|
|
WINML_THROW_HR_IF_TRUE_MSG(
|
|
E_UNEXPECTED,
|
|
true,
|
|
"The engine produced an unexpected evaluation output for unbound output variable %s.",
|
|
utf8Name.c_str());
|
|
|
|
return nullptr;
|
|
}
|
|
|
|
Windows::Foundation::IInspectable LearningModelBinding::CreateUnboundOutput(
|
|
const std::string& name,
|
|
_winmla::IOrtValue* mlValue) {
|
|
// Find valid binding port
|
|
auto bindingPort = FindValidBinding(
|
|
m_session.Model(),
|
|
WinML::Strings::WStringFromString(name));
|
|
|
|
WINML_THROW_HR_IF_FALSE_MSG(
|
|
E_UNEXPECTED,
|
|
bindingPort.has_value(),
|
|
"The engine produced an unexpected evaluation output %s, that is not a model variable.",
|
|
name.c_str());
|
|
|
|
// Retrieve the descriptor and binding type
|
|
auto descriptor = bindingPort->first;
|
|
auto bindingType = bindingPort->second;
|
|
WINML_THROW_HR_IF_FALSE_MSG(
|
|
E_UNEXPECTED,
|
|
bindingType == BindingType::kOutput,
|
|
"The engine produced an unexpected evaluation output %s, that is not a model variable output.",
|
|
name.c_str());
|
|
|
|
// Create a binding context
|
|
BindingContext context{
|
|
bindingType,
|
|
m_session,
|
|
descriptor,
|
|
nullptr /* no binding properties for unbound outputs */,
|
|
{} // SubresourceId is set by callee
|
|
};
|
|
|
|
// Create empty feature value
|
|
auto featureValue = CreateUnboundOuputFeatureValue(mlValue, descriptor);
|
|
|
|
// Update feature value
|
|
auto spLotusValueProvider = featureValue.as<WinML::ILotusValueProviderPrivate>();
|
|
WINML_THROW_IF_FAILED_MSG(
|
|
spLotusValueProvider->UpdateSourceResourceData(context, mlValue),
|
|
"Failed to update bound object for model variable output %s",
|
|
name.c_str());
|
|
|
|
// Get abi representation
|
|
winrt::Windows::Foundation::IInspectable inspectable;
|
|
WINML_THROW_IF_FAILED_MSG(
|
|
spLotusValueProvider->AbiRepresentation(inspectable),
|
|
"Failed to return bound object for model variable output %s",
|
|
name.c_str());
|
|
|
|
return inspectable;
|
|
}
|
|
|
|
std::unordered_map<std::string, Windows::Foundation::IInspectable> LearningModelBinding::UpdateProviders() {
|
|
std::unordered_map<std::string, Windows::Foundation::IInspectable> outputs;
|
|
|
|
auto& outputNames = m_lotusBinding->GetOutputNames();
|
|
auto& outputMLValues = m_lotusBinding->GetOutputs();
|
|
WINML_THROW_HR_IF_FALSE_MSG(
|
|
E_UNEXPECTED,
|
|
outputNames.size() == outputMLValues.size(),
|
|
"Evaluation produced unexpected output variables.");
|
|
|
|
for (unsigned i = 0; i < outputNames.size(); i++) {
|
|
auto utf8Name = outputNames[i];
|
|
auto mlValue = outputMLValues[i];
|
|
|
|
if (m_providers.find(utf8Name) != std::end(m_providers)) {
|
|
auto& providerInfo = m_providers[utf8Name];
|
|
auto provider = providerInfo.Provider;
|
|
auto context = providerInfo.Context;
|
|
WINML_THROW_IF_FAILED_MSG(
|
|
provider->UpdateSourceResourceData(context, mlValue),
|
|
"Failed to update bound object for model variable output %s",
|
|
utf8Name.c_str());
|
|
|
|
outputs[utf8Name] = providerInfo.CallerSpecifiedFeatureValue;
|
|
} else {
|
|
// unbound outputs
|
|
outputs[utf8Name] = CreateUnboundOutput(utf8Name, mlValue);
|
|
}
|
|
}
|
|
|
|
// Clear any converters cached on inputs to return them to the pool
|
|
for (auto&& provider : m_providers) {
|
|
if (provider.second.Context.converter != nullptr) {
|
|
provider.second.Context.converter->Get()->Tensorizer->ResetAllocator();
|
|
provider.second.Context.converter = nullptr;
|
|
}
|
|
}
|
|
|
|
return outputs;
|
|
}
|
|
|
|
STDMETHODIMP LearningModelBinding::Bind(
|
|
const wchar_t* name,
|
|
UINT32 cchName,
|
|
IUnknown* value) {
|
|
try {
|
|
_winmlt::TelemetryEvent binding_event(_winmlt::EventCategory::kBinding);
|
|
|
|
BindingType bindingType;
|
|
std::string bindingName;
|
|
_winmla::IOrtValue* bindingValuePtr;
|
|
winrt::com_ptr<_winmla::IOrtValue> bindingValue;
|
|
|
|
winrt::Windows::Foundation::IInspectable to;
|
|
RETURN_IF_FAILED(value->QueryInterface(
|
|
winrt::guid_of<winrt::Windows::Foundation::IInspectable>(),
|
|
reinterpret_cast<void**>(winrt::put_abi(to))));
|
|
|
|
auto featureName = WinML::Strings::UTF8FromUnicode(name, cchName);
|
|
std::tie(bindingName, bindingValuePtr, bindingType) = CreateBinding(featureName, to, nullptr);
|
|
bindingValue.attach(bindingValuePtr);
|
|
|
|
switch (bindingType) {
|
|
case BindingType::kInput:
|
|
WINML_THROW_IF_FAILED(m_lotusBinding->BindInput(bindingName, bindingValue.get()));
|
|
break;
|
|
case BindingType::kOutput:
|
|
WINML_THROW_IF_FAILED(m_lotusBinding->BindOutput(bindingName, bindingValue.get()));
|
|
break;
|
|
default:
|
|
FAIL_FAST();
|
|
}
|
|
return S_OK;
|
|
}
|
|
WINML_CATCH_ALL_COM
|
|
}
|
|
} // namespace winrt::Windows::AI::MachineLearning::implementation
|