onnxruntime/csharp/src/Microsoft.ML.OnnxRuntime/OrtAllocator.shared.cs
Dmitri Smirnov bd4d011142
[C#] Rename unreleased API, add utilities (#16806)
### Description
1. rename OrtValue.FillStringTensorElement to StringTensorSetElementAt .
To the API user I think we're conceptually setting the string at an
offset in the tensor with is roughly equivalent to `List<string> list
... list[index] = "value"`.
2. While working on new inference examples, I noticed that I am still
inclined to use `DenseTensor` for N-D indexing. Added `GetStrides()` and
`GetIndex()` from strides for long dims, so the user can obtain strides
and translate N-D indices into a flat index to operate directly on the
native `OrtValue` buffers. Expose these functions to the user.
3. Make sure we generate docs for C# public static  functions.
2023-08-02 10:06:42 -07:00

581 lines
23 KiB
C#

// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT License.
using Microsoft.ML.OnnxRuntime.Tensors;
using System;
using System.Runtime.InteropServices;
using System.Text;
namespace Microsoft.ML.OnnxRuntime
{
/// <summary>
/// See documentation for OrtAllocatorType in C API
/// </summary>
public enum OrtAllocatorType
{
DeviceAllocator = 0, // Device specific allocator
ArenaAllocator = 1 // Memory arena
}
/// <summary>
/// See documentation for OrtMemType in C API
/// </summary>
public enum OrtMemType
{
CpuInput = -2, // Any CPU memory used by non-CPU execution provider
CpuOutput = -1, // CPU accessible memory outputted by non-CPU execution provider, i.e. CUDA_PINNED
Cpu = CpuOutput, // temporary CPU accessible memory allocated by non-CPU execution provider, i.e. CUDA_PINNED
Default = 0, // the default allocator for execution provider
}
/// <summary>
/// This class encapsulates arena configuration information that will be used to define the behavior
/// of an arena based allocator
/// See docs/C_API.md for more details
/// </summary>
public class OrtArenaCfg : SafeHandle
{
/// <summary>
/// Create an instance of arena configuration which will be used to create an arena based allocator
/// See docs/C_API.md for details on what the following parameters mean and how to choose these values
/// </summary>
/// <param name="maxMemory">Maximum amount of memory the arena allocates</param>
/// <param name="arenaExtendStrategy">Strategy for arena expansion</param>
/// <param name="initialChunkSizeBytes">Size of the region that the arena allocates first</param>
/// <param name="maxDeadBytesPerChunk">Maximum amount of fragmentation allowed per chunk</param>
public OrtArenaCfg(uint maxMemory, int arenaExtendStrategy, int initialChunkSizeBytes, int maxDeadBytesPerChunk)
: base(IntPtr.Zero, true)
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtCreateArenaCfg((UIntPtr)maxMemory,
arenaExtendStrategy,
initialChunkSizeBytes,
maxDeadBytesPerChunk,
out handle));
}
internal IntPtr Pointer
{
get
{
return handle;
}
}
#region SafeHandle
/// <summary>
/// Overrides SafeHandle.IsInvalid
/// </summary>
/// <value>returns true if handle is equal to Zero</value>
public override bool IsInvalid { get { return handle == IntPtr.Zero; } }
/// <summary>
/// Overrides SafeHandle.ReleaseHandle() to properly dispose of
/// the native instance of OrtEnv
/// </summary>
/// <returns>always returns true</returns>
protected override bool ReleaseHandle()
{
NativeMethods.OrtReleaseArenaCfg(handle);
handle = IntPtr.Zero;
return true;
}
#endregion
}
/// <summary>
/// This class encapsulates and most of the time owns the underlying native OrtMemoryInfo instance.
/// Instance returned from OrtAllocator will not own OrtMemoryInfo, the class must be disposed
/// regardless.
///
/// Use this class to query and create OrtAllocator instances so you can pre-allocate memory for model
/// inputs/outputs and use it for binding. Instances of the class can also used to created OrtValues bound
/// to pre-allocated memory. In that case, the instance of OrtMemoryInfo contains the information about the allocator
/// used to allocate the underlying memory.
/// </summary>
public class OrtMemoryInfo : SafeHandle
{
private static readonly Lazy<OrtMemoryInfo> _defaultCpuAllocInfo = new Lazy<OrtMemoryInfo>(CreateCpuMemoryInfo);
private readonly bool _owned; // false if we are exposing OrtMemoryInfo from an allocator which owns it
private static OrtMemoryInfo CreateCpuMemoryInfo()
{
// Returns OrtMemoryInfo instance that needs to be disposed
NativeApiStatus.VerifySuccess(NativeMethods.OrtCreateCpuMemoryInfo(OrtAllocatorType.DeviceAllocator, OrtMemType.Cpu, out IntPtr memoryInfo));
return new OrtMemoryInfo(memoryInfo, true);
}
/// <summary>
/// Default CPU based instance
/// </summary>
/// <value>Singleton instance of a CpuMemoryInfo</value>
public static OrtMemoryInfo DefaultInstance
{
get
{
return _defaultCpuAllocInfo.Value;
}
}
internal IntPtr Pointer
{
get
{
return handle;
}
}
/// <summary>
/// Overrides SafeHandle.IsInvalid
/// </summary>
/// <value>returns true if handle is equal to Zero</value>
public override bool IsInvalid { get { return handle == IntPtr.Zero; } }
/// <summary>
/// This allocator takes an native pointer to already existing
/// instance of OrtMemoryInfo. That instance may either be owned or not
/// owned. In the latter case, this class serves to expose native properties
/// of the instance.
/// </summary>
/// <param name="allocInfo"></param>
internal OrtMemoryInfo(IntPtr allocInfo, bool owned)
: base(allocInfo, true)
{
_owned = owned;
}
/// <summary>
/// Predefined utf8 encoded allocator names. Use them to construct an instance of
/// OrtMemoryInfo to avoid UTF-16 to UTF-8 conversion costs.
/// </summary>
public static readonly byte[] allocatorCPU = Encoding.UTF8.GetBytes("Cpu" + Char.MinValue);
/// <summary>
/// Predefined utf8 encoded allocator names. Use them to construct an instance of
/// OrtMemoryInfo to avoid UTF-16 to UTF-8 conversion costs.
/// </summary>
public static readonly byte[] allocatorCUDA = Encoding.UTF8.GetBytes("Cuda" + Char.MinValue);
/// <summary>
/// Predefined utf8 encoded allocator names. Use them to construct an instance of
/// OrtMemoryInfo to avoid UTF-16 to UTF-8 conversion costs.
/// </summary>
public static readonly byte[] allocatorCUDA_PINNED = Encoding.UTF8.GetBytes("CudaPinned" + Char.MinValue);
/// <summary>
/// Predefined utf8 encoded allocator names. Use them to construct an instance of
/// OrtMemoryInfo to avoid UTF-16 to UTF-8 conversion costs.
/// </summary>
public static readonly byte[] allocatorHIP = Encoding.UTF8.GetBytes("Hip" + Char.MinValue);
/// <summary>
/// Predefined utf8 encoded allocator names. Use them to construct an instance of
/// OrtMemoryInfo to avoid UTF-16 to UTF-8 conversion costs.
/// </summary>
public static readonly byte[] allocatorHIP_PINNED = Encoding.UTF8.GetBytes("HipPinned" + Char.MinValue);
/// <summary>
/// Create an instance of OrtMemoryInfo according to the specification
/// Memory info instances are usually used to get a handle of a native allocator
/// that is present within the current inference session object. That, in turn, depends
/// of what execution providers are available within the binary that you are using and are
/// registered with Add methods.
/// </summary>
/// <param name="utf8AllocatorName">Allocator name. Use of the predefined above.</param>
/// <param name="allocatorType">Allocator type</param>
/// <param name="deviceId">Device id</param>
/// <param name="memoryType">Memory type</param>
public OrtMemoryInfo(byte[] utf8AllocatorName, OrtAllocatorType allocatorType, int deviceId, OrtMemType memoryType)
: base(IntPtr.Zero, true)
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtCreateMemoryInfo(utf8AllocatorName,
allocatorType,
deviceId,
memoryType,
out handle));
_owned = true;
}
/// <summary>
/// Create an instance of OrtMemoryInfo according to the specification.
/// </summary>
/// <param name="allocatorName">Allocator name</param>
/// <param name="allocatorType">Allocator type</param>
/// <param name="deviceId">Device id</param>
/// <param name="memoryType">Memory type</param>
public OrtMemoryInfo(string allocatorName, OrtAllocatorType allocatorType, int deviceId, OrtMemType memoryType)
: this(NativeOnnxValueHelper.StringToZeroTerminatedUtf8(allocatorName), allocatorType, deviceId, memoryType)
{
}
/// <summary>
/// Name of the allocator associated with the OrtMemoryInfo instance
/// </summary>
public string Name
{
get
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtMemoryInfoGetName(handle, out IntPtr utf8Name));
return NativeOnnxValueHelper.StringFromNativeUtf8(utf8Name);
}
}
/// <summary>
/// Returns device ID
/// </summary>
/// <value>returns integer Id value</value>
public int Id
{
get
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtMemoryInfoGetId(handle, out int id));
return id;
}
}
/// <summary>
/// The below 2 are really properties but naming them is a challenge
/// as names would conflict with the returned type. Also, there are native
/// calls behind them so exposing them as Get() would be appropriate.
/// </summary>
/// <returns>OrtMemoryType for the instance</returns>
public OrtMemType GetMemoryType()
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtMemoryInfoGetMemType(handle, out OrtMemType memoryType));
return memoryType;
}
/// <summary>
/// Fetches allocator type from the underlying OrtAllocator
/// </summary>
/// <returns>Returns allocator type</returns>
public OrtAllocatorType GetAllocatorType()
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtMemoryInfoGetType(handle, out OrtAllocatorType allocatorType));
return allocatorType;
}
/// <summary>
/// Overrides System.Object.Equals(object)
/// </summary>
/// <param name="obj">object to compare to</param>
/// <returns>true if obj is an instance of OrtMemoryInfo and is equal to this</returns>
public override bool Equals(object obj)
{
if (!(obj is OrtMemoryInfo other))
{
return false;
}
return Equals(other);
}
/// <summary>
/// Compares this instance with another
/// </summary>
/// <param name="other">OrtMemoryInfo to compare to</param>
/// <returns>true if instances are equal according to OrtCompareMemoryInfo.</returns>
public bool Equals(OrtMemoryInfo other)
{
if (this == other)
{
return true;
}
NativeApiStatus.VerifySuccess(NativeMethods.OrtCompareMemoryInfo(handle, other.Pointer, out int result));
return (result == 0);
}
/// <summary>
/// Overrides System.Object.GetHashCode()
/// </summary>
/// <returns>integer hash value</returns>
public override int GetHashCode()
{
return Pointer.ToInt32();
}
#region SafeHandle
/// <summary>
/// Overrides SafeHandle.ReleaseHandle() to properly dispose of
/// the native instance of OrtMmeoryInfo
/// </summary>
/// <returns>always returns true</returns>
protected override bool ReleaseHandle()
{
// If this instance exposes OrtMemoryInfo that belongs
// to the allocator then the allocator owns it
if (_owned)
{
NativeMethods.OrtReleaseMemoryInfo(handle);
}
handle = IntPtr.Zero;
return true;
}
#endregion
}
/// <summary>
/// This class represents an arbitrary buffer of memory
/// allocated and owned by the user. It can be either a CPU, GPU or other device memory
/// that can be suitably represented by IntPtr.
/// This is just a composite of the buffer related information.
/// The memory is assumed to be pinned if necessary and usable immediately
/// in the native code.
/// </summary>
[Obsolete("Create OrtValue over an arbitrary piece of memory and use it where appropriate.")]
public class OrtExternalAllocation
{
/// <summary>
/// Constructor
/// </summary>
/// <param name="memInfo">use to accurately describe a piece of memory that this is wrapping</param>
/// <param name="shape">shape of this buffer</param>
/// <param name="elementType">element type</param>
/// <param name="pointer">the actual pointer to memory</param>
/// <param name="sizeInBytes">size of the allocation in bytes</param>
public OrtExternalAllocation(OrtMemoryInfo memInfo, long[] shape, Tensors.TensorElementType elementType, IntPtr pointer, long sizeInBytes)
{
var typeInfo = TensorBase.GetElementTypeInfo(elementType) ?? throw new OnnxRuntimeException(ErrorCode.InvalidArgument,
$"Tensor element type: {elementType} is not supported");
if (typeInfo.IsString)
{
throw new OnnxRuntimeException(ErrorCode.InvalidArgument,
"Strings are not supported by this API");
}
var shapeSize = ShapeUtils.GetSizeForShape(shape);
var requiredBufferSize = shapeSize * typeInfo.TypeSize;
if (requiredBufferSize > sizeInBytes)
{
var message = String.Format("Shape of {0} elements requires a buffer of at least {1} bytes. Provided: {2} bytes",
shapeSize, requiredBufferSize, sizeInBytes);
throw new OnnxRuntimeException(ErrorCode.InvalidArgument, message);
}
Info = memInfo;
Shape = shape;
ElementType = elementType;
Pointer = pointer;
Size = sizeInBytes;
}
/// <summary>
/// OrtMemoryInfo
/// </summary>
public OrtMemoryInfo Info { get; private set; }
/// <summary>
/// Shape
/// </summary>
public long[] Shape { get; private set; }
/// <summary>
/// Data type
/// </summary>
public Tensors.TensorElementType ElementType { get; private set; }
/// <summary>
/// Actual memory ptr
/// </summary>
public IntPtr Pointer { get; private set; }
/// <summary>
/// Size of the allocation in bytes
/// </summary>
public long Size { get; private set; }
}
/// <summary>
/// This class represents memory allocation made by a specific onnxruntime
/// allocator. Use OrtAllocator.Allocate() to obtain an instance of this class.
/// It implements IDisposable and makes use of the original allocator
/// used to allocate the memory. The lifespan of the allocator instance must eclipse the
/// lifespan of the allocation. Or, if you prefer, all OrtMemoryAllocation instances must be
/// disposed of before the corresponding allocator instances are disposed of.
/// </summary>
public class OrtMemoryAllocation : SafeHandle
{
// This allocator is used to free this allocation
// This also prevents OrtAllocator GC/finalization in case
// the user forgets to Dispose() of this allocation
private OrtAllocator _allocator;
/// <summary>
/// This constructs an instance representing an native memory allocation.
/// Typically returned by OrtAllocator.Allocate(). However, some APIs return
/// natively allocated IntPtr using a specific allocator. It is a good practice
/// to wrap such a memory into OrtAllocation for proper disposal. You can set
/// size to zero if not known, which is not important for disposing.
/// </summary>
/// <param name="allocator"></param>
/// <param name="pointer"></param>
/// <param name="size"></param>
internal OrtMemoryAllocation(OrtAllocator allocator, IntPtr pointer, uint size)
: base(pointer, true)
{
_allocator = allocator;
Size = size;
}
/// <summary>
/// Internal accessor to call native methods
/// </summary>
internal IntPtr Pointer { get { return handle; } }
/// <summary>
/// Overrides SafeHandle.IsInvalid
/// </summary>
/// <value>returns true if handle is equal to Zero</value>
public override bool IsInvalid { get { return handle == IntPtr.Zero; } }
/// <summary>
/// Size of the allocation
/// </summary>
/// <value>uint size of the allocation in bytes</value>
public uint Size { get; private set; }
/// <summary>
/// Memory Information about this allocation
/// </summary>
/// <value>Returns OrtMemoryInfo from the allocator</value>
public OrtMemoryInfo Info
{
get
{
return _allocator.Info;
}
}
#region SafeHandle
/// <summary>
/// Overrides SafeHandle.ReleaseHandle() to deallocate
/// a chunk of memory using the specified allocator.
/// </summary>
/// <returns>always returns true</returns>
protected override bool ReleaseHandle()
{
_allocator.FreeMemory(handle);
handle = IntPtr.Zero;
return true;
}
#endregion
}
/// <summary>
/// The class exposes native internal allocator for Onnxruntime.
/// This allocator enables you to allocate memory from the internal
/// memory pools including device allocations. Useful for binding.
/// </summary>
public class OrtAllocator : SafeHandle
{
private static readonly Lazy<OrtAllocator> _defaultInstance = new Lazy<OrtAllocator>(GetDefaultCpuAllocator);
private readonly bool _owned;
private static OrtAllocator GetDefaultCpuAllocator()
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtGetAllocatorWithDefaultOptions(out IntPtr allocator));
// Instance of default cpu allocator is a native singleton
// Do not dispose of
return new OrtAllocator(allocator, false);
}
/// <summary>
/// Default CPU allocator instance
/// </summary>
public static OrtAllocator DefaultInstance // May throw exception in every access, if the constructor have thrown an exception
{
get
{
return _defaultInstance.Value;
}
}
internal IntPtr Pointer
{
get
{
return handle;
}
}
/// <summary>
/// Overrides SafeHandle.IsInvalid
/// </summary>
/// <value>returns true if handle is equal to Zero</value>
public override bool IsInvalid { get { return handle == IntPtr.Zero; } }
/// <summary>
/// Internal constructor wraps existing native allocators
/// </summary>
/// <param name="allocator"></param>
/// <param name="owned"></param>
internal OrtAllocator(IntPtr allocator, bool owned)
: base(allocator, true)
{
_owned = owned;
}
/// <summary>
/// Creates an instance of OrtAllocator according to the specifications in OrtMemorInfo.
/// The requested allocator should be available within the given session instance. This means
/// both, the native library was build with specific allocators (for instance CUDA) and the corresponding
/// provider was added to SessionsOptions before instantiating the session object.
/// </summary>
/// <param name="session"></param>
/// <param name="memInfo"></param>
public OrtAllocator(InferenceSession session, OrtMemoryInfo memInfo)
: base(IntPtr.Zero, true)
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtCreateAllocator(session.Handle, memInfo.Pointer, out handle));
_owned = true;
}
/// <summary>
/// OrtMemoryInfo instance owned by the allocator
/// </summary>
/// <value>Instance of OrtMemoryInfo describing this allocator</value>
public OrtMemoryInfo Info
{
get
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtAllocatorGetInfo(handle, out IntPtr memoryInfo));
// This serves as an exposure of memory_info owned by the allocator
return new OrtMemoryInfo(memoryInfo, false);
}
}
/// <summary>
/// Allocate native memory. Returns a disposable instance of OrtMemoryAllocation
/// </summary>
/// <param name="size">number of bytes to allocate</param>
/// <returns>Instance of OrtMemoryAllocation</returns>
public OrtMemoryAllocation Allocate(uint size)
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtAllocatorAlloc(handle, (UIntPtr)size, out IntPtr allocation));
return new OrtMemoryAllocation(this, allocation, size);
}
/// <summary>
/// This internal interface is used for freeing memory.
/// </summary>
/// <param name="allocation">pointer to a native memory chunk allocated by this allocator instance</param>
internal void FreeMemory(IntPtr allocation)
{
NativeApiStatus.VerifySuccess(NativeMethods.OrtAllocatorFree(handle, allocation));
}
#region SafeHandle
/// <summary>
/// Overrides SafeHandle.ReleaseHandle() to properly dispose of
/// the native instance of OrtAllocator
/// </summary>
/// <returns>always returns true</returns>
protected override bool ReleaseHandle()
{
// Singleton default allocator is not owned
if (_owned)
{
NativeMethods.OrtReleaseAllocator(handle);
}
handle = IntPtr.Zero;
return true;
}
#endregion
}
}