ONNX Runtime
Loading...
Searching...
No Matches
onnxruntime_cxx_api.h
1// Copyright (c) Microsoft Corporation. All rights reserved.
2// Licensed under the MIT License.
3
4// Summary: The Ort C++ API is a header only wrapper around the Ort C API.
5//
6// The C++ API simplifies usage by returning values directly instead of error codes, throwing exceptions on errors
7// and automatically releasing resources in the destructors. The primary purpose of C++ API is exception safety so
8// all the resources follow RAII and do not leak memory.
9//
10// Each of the C++ wrapper classes holds only a pointer to the C internal object. Treat them like smart pointers.
11// To create an empty object, pass 'nullptr' to the constructor (for example, Env e{nullptr};). However, you can't use them
12// until you assign an instance that actually holds an underlying object.
13//
14// For Ort objects only move assignment between objects is allowed, there are no copy constructors.
15// Some objects have explicit 'Clone' methods for this purpose.
16//
17// ConstXXXX types are copyable since they do not own the underlying C object, so you can pass them to functions as arguments
18// by value or by reference. ConstXXXX types are restricted to const only interfaces.
19//
20// UnownedXXXX are similar to ConstXXXX but also allow non-const interfaces.
21//
// The lifetime of the corresponding owning object must eclipse the lifetimes of the ConstXXXX/UnownedXXXX types. They exist so you do not
// have to fall back to C types and the API with the usual pitfalls. In general, do not use C API from your C++ code.
24
25#pragma once
26#include "onnxruntime_c_api.h"
27#include "onnxruntime_float16.h"
28
29#include <array>
30#include <cstddef>
31#include <cstdio>
32#include <memory>
33#include <stdexcept>
34#include <string>
35#include <type_traits>
36#include <unordered_map>
37#include <utility>
38#include <variant>
39#include <vector>
40
41#ifdef ORT_NO_EXCEPTIONS
42#include <iostream>
43#endif
44
48namespace Ort {
49
54struct Exception : std::exception {
55 Exception(const std::string& string, OrtErrorCode code) : message_{string}, code_{code} {}
56 Exception(std::string&& string, OrtErrorCode code) : message_{std::move(string)}, code_{code} {}
57
58 OrtErrorCode GetOrtErrorCode() const { return code_; }
59 const char* what() const noexcept override { return message_.c_str(); }
60
61 private:
62 std::string message_;
63 OrtErrorCode code_;
64};
65
#ifdef ORT_NO_EXCEPTIONS
// The #ifndef is for the very special case where the user of this library wants to define their own way of handling errors.
// NOTE: This header expects control flow to not continue after calling ORT_CXX_API_THROW
#ifndef ORT_CXX_API_THROW
// Default handler when exceptions are disabled: write the message to std::cerr, then abort().
#define ORT_CXX_API_THROW(string, code)       \
  do {                                        \
    std::cerr << Ort::Exception(string, code) \
                     .what()                  \
              << std::endl;                   \
    abort();                                  \
  } while (false)
#endif
#else
// Exceptions enabled: throw an Ort::Exception built from the message and code.
#define ORT_CXX_API_THROW(string, code) \
  throw Ort::Exception(string, code)
#endif
82
#ifdef ORT_API_MANUAL_INIT
// If the macro ORT_API_MANUAL_INIT is defined, no static initialization
// will be performed. Instead, users must call InitApi() before using the
// ORT C++ APIs.
//
// InitApi() sets the global API object using the default initialization
// logic. Users call this to initialize the ORT C++ APIs at a time that
// makes sense in their program.
inline void InitApi() noexcept;

// InitApi(const OrtApi*) is used by custom operator libraries that are not
// linked to onnxruntime. It sets the global API object, which is required
// by the ORT C++ APIs.
//
// Example mycustomop.cc:
//
//   #define ORT_API_MANUAL_INIT
//   #include <onnxruntime_cxx_api.h>
//   #undef ORT_API_MANUAL_INIT
//
//   OrtStatus* ORT_API_CALL RegisterCustomOps(OrtSessionOptions* options, const OrtApiBase* api_base) {
//     Ort::InitApi(api_base->GetApi(ORT_API_VERSION));
//     // ...
//   }
//
inline void InitApi(const OrtApi* api) noexcept;
#endif
110
111namespace detail {
112// This is used internally by the C++ API. This class holds the global
113// variable that points to the OrtApi.
114struct Global {
115 static const OrtApi* Api(const OrtApi* newValue = nullptr) noexcept {
116 // This block-level static will be initialized once when this function is
117 // first executed, delaying the call to DefaultInit() until it is first needed.
118 //
119 // When ORT_API_MANUAL_INIT is not defined, DefaultInit() calls
120 // OrtGetApiBase()->GetApi(), which may result in a shared library being
121 // loaded.
122 //
123 // Using a block-level static instead of a class-level static helps
124 // avoid issues with static initialization order and dynamic libraries
125 // loading other dynamic libraries.
126 //
127 // This makes it safe to include the C++ API headers in a shared library
128 // that is delay loaded or delay loads its dependencies.
129 //
130 // This DOES NOT make it safe to _use_ arbitrary ORT C++ APIs when
131 // initializing static members, however.
132 static const OrtApi* api = DefaultInit();
133
134 if (newValue) {
135 api = newValue;
136 }
137
138 return api;
139 }
140
141 private:
142 // Has different definitions based on ORT_API_MANUAL_INIT
143 static const OrtApi* DefaultInit() noexcept;
144
145#ifdef ORT_API_MANUAL_INIT
146 // Public APIs to set the OrtApi* to use.
147 friend void ::Ort::InitApi() noexcept;
148 friend void ::Ort::InitApi(const OrtApi*) noexcept;
149#endif
150};
151} // namespace detail
152
153#ifdef ORT_API_MANUAL_INIT
154
155// See comments on declaration above for usage.
156inline void InitApi(const OrtApi* api) noexcept { detail::Global::Api(api); }
157inline void InitApi() noexcept { InitApi(OrtGetApiBase()->GetApi(ORT_API_VERSION)); }
158
159#ifdef _MSC_VER
160// If you get a linker error about a mismatch here, you are trying to
161// link two compilation units that have different definitions for
162// ORT_API_MANUAL_INIT together. All compilation units must agree on the
163// definition of ORT_API_MANUAL_INIT.
164#pragma detect_mismatch("ORT_API_MANUAL_INIT", "enabled")
165#endif
166
167inline const OrtApi* detail::Global::DefaultInit() noexcept {
168 // When ORT_API_MANUAL_INIT is defined, there's no default init that can
169 // be done.
170 return nullptr;
171}
172
173#else // ORT_API_MANUAL_INIT
174
175#ifdef _MSC_VER
176// If you get a linker error about a mismatch here, you are trying to link
177// two compilation units that have different definitions for
178// ORT_API_MANUAL_INIT together. All compilation units must agree on the
179// definition of ORT_API_MANUAL_INIT.
180#pragma detect_mismatch("ORT_API_MANUAL_INIT", "disabled")
181#endif
182
183inline const OrtApi* detail::Global::DefaultInit() noexcept {
185}
186#endif // ORT_API_MANUAL_INIT
187
189inline const OrtApi& GetApi() noexcept { return *detail::Global::Api(); }
190
// Declarations only; the definitions are not part of this listing.
// NOTE(review): judging by the names these report the runtime version, the
// build information and the available execution providers — confirm against
// the definitions.
std::string GetVersionString();

std::string GetBuildInfoString();

std::vector<std::string> GetAvailableProviders();
210
216 auto* api = GetApi().GetModelEditorApi();
217 if (api == nullptr) {
218 // minimal build
219 ORT_CXX_API_THROW("Model Editor API is not available in this build", ORT_FAIL);
220 }
221
222 return *api;
223}
224
230 auto* api = GetApi().GetCompileApi();
231 if (api == nullptr) {
232 // minimal build
233 ORT_CXX_API_THROW("Compile API is not available in this build", ORT_FAIL);
234 }
235
236 return *api;
237}
238
243inline const OrtEpApi& GetEpApi() {
244 auto* api = GetApi().GetEpApi();
245 if (api == nullptr) {
246 // minimal build
247 ORT_CXX_API_THROW("EP API is not available in this build", ORT_FAIL);
248 }
249
250 return *api;
251}
252
271struct Float16_t : onnxruntime_float16::Float16Impl<Float16_t> {
272 private:
278 constexpr explicit Float16_t(uint16_t v) noexcept { val = v; }
279
280 public:
281 using Base = onnxruntime_float16::Float16Impl<Float16_t>;
282
286 Float16_t() = default;
287
293 constexpr static Float16_t FromBits(uint16_t v) noexcept { return Float16_t(v); }
294
299 explicit Float16_t(float v) noexcept { val = Base::ToUint16Impl(v); }
300
305 float ToFloat() const noexcept { return Base::ToFloatImpl(); }
306
311 using Base::IsNegative;
312
317 using Base::IsNaN;
318
323 using Base::IsFinite;
324
329 using Base::IsPositiveInfinity;
330
335 using Base::IsNegativeInfinity;
336
341 using Base::IsInfinity;
342
347 using Base::IsNaNOrZero;
348
353 using Base::IsNormal;
354
359 using Base::IsSubnormal;
360
365 using Base::Abs;
366
371 using Base::Negate;
372
381 using Base::AreZero;
382
386 explicit operator float() const noexcept { return ToFloat(); }
387
388 using Base::operator==;
389 using Base::operator!=;
390 using Base::operator<;
391};
392
393static_assert(sizeof(Float16_t) == sizeof(uint16_t), "Sizes must match");
394
413struct BFloat16_t : onnxruntime_float16::BFloat16Impl<BFloat16_t> {
414 private:
422 constexpr explicit BFloat16_t(uint16_t v) noexcept { val = v; }
423
424 public:
425 using Base = onnxruntime_float16::BFloat16Impl<BFloat16_t>;
426
427 BFloat16_t() = default;
428
434 static constexpr BFloat16_t FromBits(uint16_t v) noexcept { return BFloat16_t(v); }
435
440 explicit BFloat16_t(float v) noexcept { val = Base::ToUint16Impl(v); }
441
446 float ToFloat() const noexcept { return Base::ToFloatImpl(); }
447
452 using Base::IsNegative;
453
458 using Base::IsNaN;
459
464 using Base::IsFinite;
465
470 using Base::IsPositiveInfinity;
471
476 using Base::IsNegativeInfinity;
477
482 using Base::IsInfinity;
483
488 using Base::IsNaNOrZero;
489
494 using Base::IsNormal;
495
500 using Base::IsSubnormal;
501
506 using Base::Abs;
507
512 using Base::Negate;
513
522 using Base::AreZero;
523
527 explicit operator float() const noexcept { return ToFloat(); }
528
529 // We do not have an inherited impl for the below operators
530 // as the internal class implements them a little differently
531 bool operator==(const BFloat16_t& rhs) const noexcept;
532 bool operator!=(const BFloat16_t& rhs) const noexcept { return !(*this == rhs); }
533 bool operator<(const BFloat16_t& rhs) const noexcept;
534};
535
536static_assert(sizeof(BFloat16_t) == sizeof(uint16_t), "Sizes must match");
537
/// \brief One-byte holder for the raw bits of a Float8E4M3FN value.
///
/// Only stores and compares the bit pattern; no numeric conversion is provided.
// NOTE(review): the `struct` header line was missing from this listing and is
// restored here from the constructor names and the static_assert below.
struct Float8E4M3FN_t {
  uint8_t value;
  /// Zero-initialises the stored bits.
  constexpr Float8E4M3FN_t() noexcept : value(0) {}
  /// Implicit conversion from a raw byte.
  constexpr Float8E4M3FN_t(uint8_t v) noexcept : value(v) {}
  /// Implicit conversion back to the raw byte.
  constexpr operator uint8_t() const noexcept { return value; }
  // nan values are treated like any other value for operator ==, !=
  constexpr bool operator==(const Float8E4M3FN_t& rhs) const noexcept { return value == rhs.value; }
  constexpr bool operator!=(const Float8E4M3FN_t& rhs) const noexcept { return value != rhs.value; }
};

static_assert(sizeof(Float8E4M3FN_t) == sizeof(uint8_t), "Sizes must match");
554
/// \brief One-byte holder for the raw bits of a Float8E4M3FNUZ value.
///
/// Only stores and compares the bit pattern; no numeric conversion is provided.
// NOTE(review): the `struct` header line was missing from this listing and is
// restored here from the constructor names and the static_assert below.
struct Float8E4M3FNUZ_t {
  uint8_t value;
  /// Zero-initialises the stored bits.
  constexpr Float8E4M3FNUZ_t() noexcept : value(0) {}
  /// Implicit conversion from a raw byte.
  constexpr Float8E4M3FNUZ_t(uint8_t v) noexcept : value(v) {}
  /// Implicit conversion back to the raw byte.
  constexpr operator uint8_t() const noexcept { return value; }
  // nan values are treated like any other value for operator ==, !=
  constexpr bool operator==(const Float8E4M3FNUZ_t& rhs) const noexcept { return value == rhs.value; }
  constexpr bool operator!=(const Float8E4M3FNUZ_t& rhs) const noexcept { return value != rhs.value; }
};

static_assert(sizeof(Float8E4M3FNUZ_t) == sizeof(uint8_t), "Sizes must match");
571
/// \brief One-byte holder for the raw bits of a Float8E5M2 value.
///
/// Only stores and compares the bit pattern; no numeric conversion is provided.
// NOTE(review): the `struct` header line was missing from this listing and is
// restored here from the constructor names and the static_assert below.
struct Float8E5M2_t {
  uint8_t value;
  /// Zero-initialises the stored bits.
  constexpr Float8E5M2_t() noexcept : value(0) {}
  /// Implicit conversion from a raw byte.
  constexpr Float8E5M2_t(uint8_t v) noexcept : value(v) {}
  /// Implicit conversion back to the raw byte.
  constexpr operator uint8_t() const noexcept { return value; }
  // nan values are treated like any other value for operator ==, !=
  constexpr bool operator==(const Float8E5M2_t& rhs) const noexcept { return value == rhs.value; }
  constexpr bool operator!=(const Float8E5M2_t& rhs) const noexcept { return value != rhs.value; }
};

static_assert(sizeof(Float8E5M2_t) == sizeof(uint8_t), "Sizes must match");
588
/// \brief One-byte holder for the raw bits of a Float8E5M2FNUZ value.
///
/// Only stores and compares the bit pattern; no numeric conversion is provided.
// NOTE(review): the `struct` header line was missing from this listing and is
// restored here from the constructor names and the static_assert below.
struct Float8E5M2FNUZ_t {
  uint8_t value;
  /// Zero-initialises the stored bits.
  constexpr Float8E5M2FNUZ_t() noexcept : value(0) {}
  /// Implicit conversion from a raw byte.
  constexpr Float8E5M2FNUZ_t(uint8_t v) noexcept : value(v) {}
  /// Implicit conversion back to the raw byte.
  constexpr operator uint8_t() const noexcept { return value; }
  // nan values are treated like any other value for operator ==, !=
  constexpr bool operator==(const Float8E5M2FNUZ_t& rhs) const noexcept { return value == rhs.value; }
  constexpr bool operator!=(const Float8E5M2FNUZ_t& rhs) const noexcept { return value != rhs.value; }
};

static_assert(sizeof(Float8E5M2FNUZ_t) == sizeof(uint8_t), "Sizes must match");
605
606namespace detail {
607// This is used internally by the C++ API. This macro is to make it easy to generate overloaded methods for all of the various OrtRelease* functions for every Ort* type
608// This can't be done in the C API since C doesn't have function overloading.
609#define ORT_DEFINE_RELEASE(NAME) \
610 inline void OrtRelease(Ort##NAME* ptr) { GetApi().Release##NAME(ptr); }
611
612#define ORT_DEFINE_RELEASE_FROM_API_STRUCT(NAME, API_GETTER) \
613 inline void OrtRelease(Ort##NAME* ptr) { API_GETTER().Release##NAME(ptr); }
614
615ORT_DEFINE_RELEASE(Allocator);
616ORT_DEFINE_RELEASE(ArenaCfg);
617ORT_DEFINE_RELEASE(CustomOpDomain);
618ORT_DEFINE_RELEASE(Env);
619ORT_DEFINE_RELEASE(ExternalInitializerInfo);
620ORT_DEFINE_RELEASE(Graph);
621ORT_DEFINE_RELEASE(IoBinding);
622ORT_DEFINE_RELEASE(KernelInfo);
623ORT_DEFINE_RELEASE(KeyValuePairs);
624ORT_DEFINE_RELEASE(LoraAdapter);
625ORT_DEFINE_RELEASE(MemoryInfo);
626ORT_DEFINE_RELEASE(MapTypeInfo);
627ORT_DEFINE_RELEASE(Model);
628ORT_DEFINE_RELEASE(ModelMetadata);
629ORT_DEFINE_RELEASE(Node);
630ORT_DEFINE_RELEASE(Op);
631ORT_DEFINE_RELEASE(OpAttr);
632ORT_DEFINE_RELEASE(PrepackedWeightsContainer);
633ORT_DEFINE_RELEASE(RunOptions);
634ORT_DEFINE_RELEASE(Session);
635ORT_DEFINE_RELEASE(SessionOptions);
636ORT_DEFINE_RELEASE(SequenceTypeInfo);
637ORT_DEFINE_RELEASE(Status);
638ORT_DEFINE_RELEASE(SyncStream);
639ORT_DEFINE_RELEASE(TensorTypeAndShapeInfo);
640ORT_DEFINE_RELEASE(ThreadingOptions);
641ORT_DEFINE_RELEASE(TypeInfo);
642ORT_DEFINE_RELEASE(Value);
643ORT_DEFINE_RELEASE(ValueInfo);
644
645ORT_DEFINE_RELEASE_FROM_API_STRUCT(ModelCompilationOptions, GetCompileApi);
646ORT_DEFINE_RELEASE_FROM_API_STRUCT(EpDevice, GetEpApi);
647
648// This is defined explicitly since OrtTensorRTProviderOptionsV2 is not a C API type,
649// but the struct has V2 in its name to indicate that it is the second version of the options.
652
653#undef ORT_DEFINE_RELEASE
654#undef ORT_DEFINE_RELEASE_FROM_API_STRUCT
655
/// \brief Tag wrapper used as a template argument to select the
/// Base<Unowned<T>> specialization.
///
/// Carries no data; Type names the wrapped type.
template <typename T>
struct Unowned {
  using Type = T;
};
663
683template <typename T>
684struct Base {
685 using contained_type = T;
686
687 constexpr Base() = default;
688 constexpr explicit Base(contained_type* p) noexcept : p_{p} {}
690 OrtRelease(p_);
691 }
692
693 Base(const Base&) = delete;
694 Base& operator=(const Base&) = delete;
695
696 Base(Base&& v) noexcept : p_{v.p_} { v.p_ = nullptr; }
697 Base& operator=(Base&& v) noexcept {
698 OrtRelease(p_);
699 p_ = v.release();
700 return *this;
701 }
702
703 constexpr operator contained_type*() const noexcept { return p_; }
704 constexpr contained_type& operator*() const noexcept { return *p_; }
705
709 T* p = p_;
710 p_ = nullptr;
711 return p;
712 }
713
714 protected:
716};
717
718// Undefined. For const types use Base<Unowned<const T>>
719template <typename T>
720struct Base<const T>;
721
729template <typename T>
730struct Base<Unowned<T>> {
732
733 constexpr Base() = default;
734 constexpr explicit Base(contained_type* p) noexcept : p_{p} {}
735
736 ~Base() = default;
737
738 Base(const Base&) = default;
739 Base& operator=(const Base&) = default;
740
741 Base(Base&& v) noexcept : p_{v.p_} { v.p_ = nullptr; }
742 Base& operator=(Base&& v) noexcept {
743 p_ = nullptr;
744 std::swap(p_, v.p_);
745 return *this;
746 }
747
748 constexpr operator contained_type*() const noexcept { return p_; }
749 constexpr contained_type& operator*() const noexcept { return *p_; }
750
751 protected:
753};
754
755// Light functor to release memory with OrtAllocator
758 explicit AllocatedFree(OrtAllocator* allocator)
759 : allocator_(allocator) {}
760 void operator()(void* ptr) const {
761 if (ptr) allocator_->Free(allocator_, ptr);
762 }
763};
764
765} // namespace detail
766
// Forward declarations of wrapper types referenced before their definitions.
struct AllocatorWithDefaultOptions;
struct Env;
struct EpDevice;
struct ExternalInitializerInfo;
struct Graph;
struct Model;
struct Node;
struct ModelMetadata;
struct TypeInfo;
struct PrepackedWeightsContainer;
struct Session;
struct SessionOptions;
struct SyncStream;
struct TensorRTProviderOptions;
struct Value;
struct ValueInfo;
783
788using AllocatedStringPtr = std::unique_ptr<char, detail::AllocatedFree>;
789
794struct Status : detail::Base<OrtStatus> {
795 Status() = default; // Same as with std::nullptr_t. But can be used in re-sizable containers and represent success.
796 explicit Status(std::nullptr_t) noexcept {}
797 explicit Status(OrtStatus* status) noexcept;
798 explicit Status(const Exception&);
799 explicit Status(const std::exception&);
800 Status(const char* message, OrtErrorCode code);
801 std::string GetErrorMessage() const;
803 bool IsOK() const noexcept;
804};
805
835
840struct TensorRTProviderOptions : detail::Base<OrtTensorRTProviderOptionsV2> {
841 TensorRTProviderOptions(std::nullptr_t) {}
845 void Update(const std::unordered_map<std::string, std::string>& options);
847 void UpdateWithValue(const char* key, void* value);
848
850 void* GetOptionByName(const char* name) const;
853};
854
859struct CUDAProviderOptions : detail::Base<OrtCUDAProviderOptionsV2> {
860 CUDAProviderOptions(std::nullptr_t) {}
864 void Update(const std::unordered_map<std::string, std::string>& options);
868 void UpdateWithValue(const char* key, void* value);
870 void* GetOptionByName(const char* name) const;
871};
872
887
888namespace detail {
889template <typename T>
891 using B = Base<T>;
892 using B::B;
893
894 // Wraps OrtApi::ExternalInitializerInfo_GetFilePath
895 const std::basic_string<ORTCHAR_T> GetFilePath() const;
896 // Wraps OrtApi::ExternalInitializerInfo_GetFileOffset
897 int64_t GetFileOffset() const;
898 // Wraps OrtApi::ExternalInitializerInfo_GetByteSize
899 size_t GetByteSize() const;
900};
901} // namespace detail
902
903// Const object holder that does not own the underlying object
906
912 using Base::Base;
913
914 explicit ExternalInitializerInfo(std::nullptr_t) {}
916 : detail::ConstExternalInitializerInfoImpl<OrtExternalInitializerInfo>{p} {}
917
919
921 ExternalInitializerInfo(const ORTCHAR_T* filepath, int64_t file_offset, size_t byte_size);
922
924 static Status Create(const ORTCHAR_T* filepath, int64_t file_offset, size_t byte_size,
925 /*out*/ ExternalInitializerInfo& out);
926};
927
928namespace detail {
929template <typename T>
932 using B::B;
933
934 const char* GetValue(const char* key) const;
935
936 // get the pairs in unordered_map. needs to copy to std::string so the hash works as expected
937 std::unordered_map<std::string, std::string> GetKeyValuePairs() const;
938 // get the pairs in two vectors. entries will be 1:1 between keys and values. avoids copying to std::string
939 void GetKeyValuePairs(std::vector<const char*>& keys, std::vector<const char*>& values) const;
940};
941} // namespace detail
942
943// Const object holder that does not own the underlying object
945
947struct KeyValuePairs : detail::KeyValuePairsImpl<OrtKeyValuePairs> {
948 explicit KeyValuePairs(std::nullptr_t) {}
950 explicit KeyValuePairs(OrtKeyValuePairs* p) : KeyValuePairsImpl<OrtKeyValuePairs>{p} {}
951
953 explicit KeyValuePairs();
954
956 explicit KeyValuePairs(const std::unordered_map<std::string, std::string>& kv_pairs);
957
959 void Add(const char* key, const char* value);
960
962 void Remove(const char* key);
963
964 ConstKeyValuePairs GetConst() const { return ConstKeyValuePairs{this->p_}; }
965};
966
967namespace detail {
968template <typename T>
969struct MemoryInfoImpl : Base<T> {
970 using B = Base<T>;
971 using B::B;
972
973 std::string GetAllocatorName() const;
975 int GetDeviceId() const;
979 uint32_t GetVendorId() const;
980
981 template <typename U>
982 bool operator==(const MemoryInfoImpl<U>& o) const;
983};
984} // namespace detail
985
986// Const object holder that does not own the underlying object
988
992struct MemoryInfo : detail::MemoryInfoImpl<OrtMemoryInfo> {
994 explicit MemoryInfo(std::nullptr_t) {}
995 explicit MemoryInfo(OrtMemoryInfo* p) : MemoryInfoImpl<OrtMemoryInfo>{p} {}
996 MemoryInfo(const char* name, OrtAllocatorType type, int id, OrtMemType mem_type);
997 MemoryInfo(const char* name, OrtMemoryInfoDeviceType device_type, uint32_t vendor_id, uint32_t device_id,
998 OrtDeviceMemoryType mem_type, size_t alignment, OrtAllocatorType allocator_type);
999 ConstMemoryInfo GetConst() const { return ConstMemoryInfo{this->p_}; }
1000};
1001
1009 MemoryAllocation(OrtAllocator* allocator, void* p, size_t size);
1014 MemoryAllocation& operator=(MemoryAllocation&&) noexcept;
1015
1016 void* get() { return p_; }
1017 size_t size() const { return size_; }
1018
1019 private:
1020 OrtAllocator* allocator_;
1021 void* p_;
1022 size_t size_;
1023};
1024
1025namespace detail {
1026template <typename T>
1027struct AllocatorImpl : Base<T> {
1028 using B = Base<T>;
1029 using B::B;
1030
1031 void* Alloc(size_t size);
1032 MemoryAllocation GetAllocation(size_t size);
1033 void Free(void* p);
1034 ConstMemoryInfo GetInfo() const;
1035
1040 KeyValuePairs GetStats() const;
1041};
1042} // namespace detail
1043
1047struct AllocatorWithDefaultOptions : detail::AllocatorImpl<detail::Unowned<OrtAllocator>> {
1048 explicit AllocatorWithDefaultOptions(std::nullptr_t) {}
1050};
1051
1056struct Allocator : detail::AllocatorImpl<OrtAllocator> {
1057 explicit Allocator(std::nullptr_t) {}
1058 Allocator(const Session& session, const OrtMemoryInfo*);
1059};
1060
1061using UnownedAllocator = detail::AllocatorImpl<detail::Unowned<OrtAllocator>>;
1062
1067namespace detail {
1068template <typename T>
1070 using B = Base<T>;
1071 using B::B;
1072 // For some reason this is not a const method on the stream
1073 void* GetHandle();
1074};
1075} // namespace detail
1076
1077struct SyncStream : detail::SyncStreamImpl<OrtSyncStream> {
1079 explicit SyncStream(std::nullptr_t) {}
1081 explicit SyncStream(OrtSyncStream* p) : SyncStreamImpl<OrtSyncStream>{p} {}
1082};
1083
1085
1086namespace detail {
1087template <typename T>
1090 using B::B;
1091
1093 uint32_t VendorId() const;
1094 uint32_t DeviceId() const;
1095 const char* Vendor() const;
1097};
1098} // namespace detail
1099
1104
1105namespace detail {
1106template <typename T>
1109 using B::B;
1110
1111 const char* EpName() const;
1112 const char* EpVendor() const;
1118};
1119} // namespace detail
1120
1125
1128struct EpDevice : detail::EpDeviceImpl<OrtEpDevice> {
1129 explicit EpDevice(std::nullptr_t) {}
1130 explicit EpDevice(OrtEpDevice* p) : EpDeviceImpl<OrtEpDevice>{p} {}
1131
1133 EpDevice(OrtEpFactory& ep_factory, ConstHardwareDevice& hardware_device,
1134 ConstKeyValuePairs ep_metadata = {}, ConstKeyValuePairs ep_options = {});
1135};
1136
1144 const std::vector<ConstEpDevice>& ep_devices,
1145 const char* compatibility_info);
1146
1152struct Env : detail::Base<OrtEnv> {
1153 explicit Env(std::nullptr_t) {}
1154
1156 Env(OrtLoggingLevel logging_level = ORT_LOGGING_LEVEL_WARNING, _In_ const char* logid = "");
1157
1159 Env(OrtLoggingLevel logging_level, const char* logid, OrtLoggingFunction logging_function, void* logger_param);
1160
1162 Env(const OrtThreadingOptions* tp_options, OrtLoggingLevel logging_level = ORT_LOGGING_LEVEL_WARNING, _In_ const char* logid = "");
1163
1165 Env(const OrtThreadingOptions* tp_options, OrtLoggingFunction logging_function, void* logger_param,
1166 OrtLoggingLevel logging_level = ORT_LOGGING_LEVEL_WARNING, _In_ const char* logid = "");
1167
1169 explicit Env(OrtEnv* p) : Base<OrtEnv>{p} {}
1170
1173
1175
1176 Env& CreateAndRegisterAllocator(const OrtMemoryInfo* mem_info, const OrtArenaCfg* arena_cfg);
1177
1178 Env& CreateAndRegisterAllocatorV2(const std::string& provider_type, const OrtMemoryInfo* mem_info,
1179 const std::unordered_map<std::string, std::string>& options,
1180 const OrtArenaCfg* arena_cfg);
1181
1183
1185
1187 OrtAllocatorType allocator_type,
1188 const OrtKeyValuePairs* allocator_options);
1189
1190 // Result may be nullptr
1192
1194 OrtDeviceMemoryType mem_type);
1195
1196 Env& RegisterExecutionProviderLibrary(const char* registration_name, const std::basic_string<ORTCHAR_T>& path);
1197 Env& UnregisterExecutionProviderLibrary(const char* registration_name);
1198
1199 std::vector<ConstEpDevice> GetEpDevices() const;
1200
1201 Status CopyTensors(const std::vector<Value>& src_tensors,
1202 const std::vector<Value>& dst_tensors,
1203 OrtSyncStream* stream) const;
1204};
1205
1209struct CustomOpDomain : detail::Base<OrtCustomOpDomain> {
1211 using Base::Base;
1212
1213 explicit CustomOpDomain(std::nullptr_t) {}
1214
1216 explicit CustomOpDomain(const char* domain);
1217
1218 // This does not take ownership of the op, simply registers it.
1219 void Add(const OrtCustomOp* op);
1220};
1221
1223struct LoraAdapter : detail::Base<OrtLoraAdapter> {
1225 using Base::Base;
1226
1227 explicit LoraAdapter(std::nullptr_t) {}
1234 static LoraAdapter CreateLoraAdapter(const std::basic_string<ORTCHAR_T>& adapter_path,
1235 OrtAllocator* allocator);
1236
1244 static LoraAdapter CreateLoraAdapterFromArray(const void* bytes, size_t num_bytes,
1245 OrtAllocator* allocator);
1246};
1247
1251struct RunOptions : detail::Base<OrtRunOptions> {
1252 explicit RunOptions(std::nullptr_t) {}
1254
1257
1260
1261 RunOptions& SetRunTag(const char* run_tag);
1262 const char* GetRunTag() const;
1263
1264 RunOptions& AddConfigEntry(const char* config_key, const char* config_value);
1265 const char* GetConfigEntry(const char* config_key);
1266
1273
1279
1287};
1288
namespace detail {
// Utility function that returns a SessionOption config entry key for a specific custom operator.
// Ex: custom_op.[custom_op_name].[config]
std::string MakeCustomOpConfigEntryKey(const char* custom_op_name, const char* config);
}  // namespace detail
1294
1305 CustomOpConfigs() = default;
1306 ~CustomOpConfigs() = default;
1311
1320 CustomOpConfigs& AddConfig(const char* custom_op_name, const char* config_key, const char* config_value);
1321
1330 const std::unordered_map<std::string, std::string>& GetFlattenedConfigs() const;
1331
1332 private:
1333 std::unordered_map<std::string, std::string> flat_configs_;
1334};
1335
1341namespace detail {
1342// we separate const-only methods because passing const ptr to non-const methods
1343// is only discovered when inline methods are compiled which is counter-intuitive
1344template <typename T>
1345struct ConstSessionOptionsImpl : Base<T> {
1346 using B = Base<T>;
1347 using B::B;
1348
1349 SessionOptions Clone() const;
1350
1351 std::string GetConfigEntry(const char* config_key) const;
1352 bool HasConfigEntry(const char* config_key) const;
1353 std::string GetConfigEntryOrDefault(const char* config_key, const std::string& def) const;
1354};
1355
1356template <typename T>
1357struct SessionOptionsImpl : ConstSessionOptionsImpl<T> {
1358 using B = ConstSessionOptionsImpl<T>;
1359 using B::B;
1360
1361 SessionOptionsImpl& SetIntraOpNumThreads(int intra_op_num_threads);
1362 SessionOptionsImpl& SetInterOpNumThreads(int inter_op_num_threads);
1363 SessionOptionsImpl& SetGraphOptimizationLevel(GraphOptimizationLevel graph_optimization_level);
1364 SessionOptionsImpl& SetDeterministicCompute(bool value);
1365
1366 SessionOptionsImpl& EnableCpuMemArena();
1367 SessionOptionsImpl& DisableCpuMemArena();
1368
1369 SessionOptionsImpl& SetOptimizedModelFilePath(const ORTCHAR_T* optimized_model_file);
1370
1371 SessionOptionsImpl& EnableProfiling(const ORTCHAR_T* profile_file_prefix);
1372 SessionOptionsImpl& DisableProfiling();
1373
1374 SessionOptionsImpl& EnableOrtCustomOps();
1375
1376 SessionOptionsImpl& EnableMemPattern();
1377 SessionOptionsImpl& DisableMemPattern();
1378
1379 SessionOptionsImpl& SetExecutionMode(ExecutionMode execution_mode);
1380
1381 SessionOptionsImpl& SetLoadCancellationFlag(bool value);
1382
1383 SessionOptionsImpl& SetLogId(const char* logid);
1384 SessionOptionsImpl& SetLogSeverityLevel(int level);
1385
1386 SessionOptionsImpl& Add(OrtCustomOpDomain* custom_op_domain);
1387
1388 SessionOptionsImpl& DisablePerSessionThreads();
1389
1390 SessionOptionsImpl& AddConfigEntry(const char* config_key, const char* config_value);
1391
1392 SessionOptionsImpl& AddInitializer(const char* name, const OrtValue* ort_val);
1393 SessionOptionsImpl& AddExternalInitializers(const std::vector<std::string>& names, const std::vector<Value>& ort_values);
1394 SessionOptionsImpl& AddExternalInitializersFromFilesInMemory(const std::vector<std::basic_string<ORTCHAR_T>>& external_initializer_file_names,
1395 const std::vector<char*>& external_initializer_file_buffer_array,
1396 const std::vector<size_t>& external_initializer_file_lengths);
1397
1398 SessionOptionsImpl& AppendExecutionProvider_CPU(int use_arena);
1399 SessionOptionsImpl& AppendExecutionProvider_CUDA(const OrtCUDAProviderOptions& provider_options);
1400 SessionOptionsImpl& AppendExecutionProvider_CUDA_V2(const OrtCUDAProviderOptionsV2& provider_options);
1401 SessionOptionsImpl& AppendExecutionProvider_ROCM(const OrtROCMProviderOptions& provider_options);
1402 SessionOptionsImpl& AppendExecutionProvider_OpenVINO(const OrtOpenVINOProviderOptions& provider_options);
1404 SessionOptionsImpl& AppendExecutionProvider_OpenVINO_V2(const std::unordered_map<std::string, std::string>& provider_options = {});
1405 SessionOptionsImpl& AppendExecutionProvider_TensorRT(const OrtTensorRTProviderOptions& provider_options);
1406 SessionOptionsImpl& AppendExecutionProvider_TensorRT_V2(const OrtTensorRTProviderOptionsV2& provider_options);
1407 SessionOptionsImpl& AppendExecutionProvider_MIGraphX(const OrtMIGraphXProviderOptions& provider_options);
1409 SessionOptionsImpl& AppendExecutionProvider_CANN(const OrtCANNProviderOptions& provider_options);
1411 SessionOptionsImpl& AppendExecutionProvider_Dnnl(const OrtDnnlProviderOptions& provider_options);
1413 SessionOptionsImpl& AppendExecutionProvider(const std::string& provider_name,
1414 const std::unordered_map<std::string, std::string>& provider_options = {});
1415
1418 SessionOptionsImpl& AppendExecutionProvider_V2(Env& env, const std::vector<ConstEpDevice>& ep_devices,
1419 const KeyValuePairs& ep_options);
1422 SessionOptionsImpl& AppendExecutionProvider_V2(Env& env, const std::vector<ConstEpDevice>& ep_devices,
1423 const std::unordered_map<std::string, std::string>& ep_options);
1424
1426 SessionOptionsImpl& SetEpSelectionPolicy(OrtExecutionProviderDevicePolicy policy);
1427
1429 SessionOptionsImpl& SetEpSelectionPolicy(EpSelectionDelegate delegate, void* state = nullptr);
1430
1431 SessionOptionsImpl& SetCustomCreateThreadFn(OrtCustomCreateThreadFn ort_custom_create_thread_fn);
1432 SessionOptionsImpl& SetCustomThreadCreationOptions(void* ort_custom_thread_creation_options);
1433 SessionOptionsImpl& SetCustomJoinThreadFn(OrtCustomJoinThreadFn ort_custom_join_thread_fn);
1434
1438 SessionOptionsImpl& RegisterCustomOpsLibrary(const ORTCHAR_T* library_name, const CustomOpConfigs& custom_op_configs = {});
1439
1440 SessionOptionsImpl& RegisterCustomOpsUsingFunction(const char* function_name);
1441
1443 SessionOptionsImpl& AppendExecutionProvider_VitisAI(const std::unordered_map<std::string, std::string>& provider_options = {});
1444};
1445} // namespace detail
1446
1447using UnownedSessionOptions = detail::SessionOptionsImpl<detail::Unowned<OrtSessionOptions>>;
1448using ConstSessionOptions = detail::ConstSessionOptionsImpl<detail::Unowned<const OrtSessionOptions>>;
1449
/// Wrapper around an OrtSessionOptions pointer, built on detail::SessionOptionsImpl<OrtSessionOptions>.
/// NOTE(review): presumably owns (and releases) the underlying object like the other non-Unowned wrappers - confirm against detail::Base.
1453struct SessionOptions : detail::SessionOptionsImpl<OrtSessionOptions> {
1454 explicit SessionOptions(std::nullptr_t) {}  ///< Creates an empty wrapper holding no underlying object; assign a valid instance before use.
1456 explicit SessionOptions(OrtSessionOptions* p) : SessionOptionsImpl<OrtSessionOptions>{p} {}  ///< Wraps an existing C API pointer by forwarding it to the base class.
1459};
1460
1465struct ModelCompilationOptions : detail::Base<OrtModelCompilationOptions> {
1467 using Base::Base;
1468
1469 explicit ModelCompilationOptions(std::nullptr_t) {}
1470
1471 ModelCompilationOptions(const Env& env, const SessionOptions& session_options);
1472 ModelCompilationOptions(const Env& env, ConstSessionOptions session_options);
1473
1474 ModelCompilationOptions& SetInputModelPath(const ORTCHAR_T* input_model_path);
1476 size_t input_model_data_size);
1477 ModelCompilationOptions& SetEpContextEmbedMode(bool embed_ep_context_in_model);
1478 ModelCompilationOptions& SetOutputModelPath(const ORTCHAR_T* output_model_path);
1480 size_t initializer_size_threshold);
1481
1484 OrtGetInitializerLocationFunc get_initializer_location_func,
1485 void* state);
1486
1487 ModelCompilationOptions& SetOutputModelBuffer(OrtAllocator* allocator, void** output_model_buffer_ptr,
1488 size_t* output_model_buffer_size_ptr);
1489
1492
1493 ModelCompilationOptions& SetEpContextBinaryInformation(const ORTCHAR_T* output_directory,
1494 const ORTCHAR_T* model_name);
1496
1498};
1499
/// Free function taking an environment and a set of model compilation options; the outcome is reported
/// through the returned Status rather than (only) via an exception.
/// NOTE(review): presumably wraps the C API compile entry point - confirm against the definition.
1506Status CompileModel(const Env& env, const ModelCompilationOptions& model_compilation_options);
1507
1511struct ModelMetadata : detail::Base<OrtModelMetadata> {
1513 using Base::Base;
1514
1515 explicit ModelMetadata(std::nullptr_t) {}
1516
1524
1532
1540
1548
1556
1563 std::vector<AllocatedStringPtr> GetCustomMetadataMapKeysAllocated(OrtAllocator* allocator) const;
1564
1575
1576 int64_t GetVersion() const;
1577};
1578
1579struct IoBinding;
1580
1581namespace detail {
1582
1583// we separate const-only methods because passing const ptr to non-const methods
1584// is only discovered when inline methods are compiled which is counter-intuitive
1585template <typename T>
1587 using B = Base<T>;
1588 using B::B;
1589
1590 size_t GetInputCount() const;
1591 size_t GetOutputCount() const;
1593
1594 std::vector<std::string> GetInputNames() const;
1595 std::vector<std::string> GetOutputNames() const;
1596 std::vector<std::string> GetOverridableInitializerNames() const;
1597
1598 std::vector<ConstMemoryInfo> GetMemoryInfoForInputs() const;
1599 std::vector<ConstMemoryInfo> GetMemoryInfoForOutputs() const;
1600 std::vector<ConstEpDevice> GetEpDeviceForInputs() const;
1601
1610
1619
1628
1629 uint64_t GetProfilingStartTimeNs() const;
1631
1632 TypeInfo GetInputTypeInfo(size_t index) const;
1633 TypeInfo GetOutputTypeInfo(size_t index) const;
1635
1636 int GetOpset(const std::string& domain) const;
1637
1638 // Will move before checkin if that's the case.
1639 std::vector<ValueInfo> GetInputs() const;
1640 std::vector<ValueInfo> GetOutputs() const;
1641};
1642
1643template <typename T>
1646 using B::B;
1647
1665 std::vector<Value> Run(const RunOptions& run_options, const char* const* input_names, const Value* input_values, size_t input_count,
1666 const char* const* output_names, size_t output_count);
1667
1671 void Run(const RunOptions& run_options, const char* const* input_names, const Value* input_values, size_t input_count,
1672 const char* const* output_names, Value* output_values, size_t output_count);
1673
1674 void Run(const RunOptions& run_options, const IoBinding&);
1675
1695 void RunAsync(const RunOptions& run_options, const char* const* input_names, const Value* input_values, size_t input_count,
1696 const char* const* output_names, Value* output_values, size_t output_count, RunAsyncCallbackFn callback, void* user_data);
1697
1705
1717 void SetEpDynamicOptions(const char* const* keys, const char* const* values, size_t kv_len);
1718
1719 void FinalizeModelEditorSession(const Model& model, const SessionOptions& options,
1720 OrtPrepackedWeightsContainer* prepacked_weights_container = nullptr);
1721};
1722
1723} // namespace detail
1724
1727
/// Wrapper around an OrtSession pointer, built on detail::SessionImpl<OrtSession>.
/// Constructors accept either a model path or an in-memory model buffer, each with an optional
/// prepacked-weights container. Definitions live out of line.
1731struct Session : detail::SessionImpl<OrtSession> {
1733 explicit Session(std::nullptr_t) {}  ///< Creates an empty wrapper holding no underlying object; assign a valid instance before use.
1734 explicit Session(OrtSession* p) : SessionImpl{p} {}  ///< Wraps an existing C API pointer by forwarding it to the base class.
1735
 /// Takes the environment, the path of the model, and the session options.
1736 Session(const Env& env, const ORTCHAR_T* model_path, const SessionOptions& options);
1737
 /// Same as the model-path constructor, with an additional OrtPrepackedWeightsContainer pointer.
1739 Session(const Env& env, const ORTCHAR_T* model_path, const SessionOptions& options,
1740 OrtPrepackedWeightsContainer* prepacked_weights_container);
1741
 /// Takes the environment, a pointer to model data with its length, and the session options.
1743 Session(const Env& env, const void* model_data, size_t model_data_length, const SessionOptions& options);
1744
 /// Same as the model-data constructor, with an additional OrtPrepackedWeightsContainer pointer.
1746 Session(const Env& env, const void* model_data, size_t model_data_length, const SessionOptions& options,
1747 OrtPrepackedWeightsContainer* prepacked_weights_container);
1748
 // The members below are compiled out when ORT_MINIMAL_BUILD is defined.
1749#if !defined(ORT_MINIMAL_BUILD)
 /// Takes the environment, a Model object, and the session options.
1751 Session(const Env& env, const Model& model, const SessionOptions& options);
1752
 /// Static factory returning a Session by value; takes a model path.
1754 static Session CreateModelEditorSession(const Env& env, const ORTCHAR_T* model_path, const SessionOptions& options);
1755
 /// Static factory returning a Session by value; takes a model data pointer and its length.
1757 static Session CreateModelEditorSession(const Env& env, const void* model_data, size_t model_data_length,
1758 const SessionOptions& options);
1759#endif // !defined(ORT_MINIMAL_BUILD)
1760
1761 ConstSession GetConst() const { return ConstSession{this->p_}; }  ///< Builds a ConstSession from the same underlying pointer.
1762 UnownedSession GetUnowned() const { return UnownedSession{this->p_}; }  ///< Builds an UnownedSession from the same underlying pointer.
1763};
1764
1765namespace detail {
1766template <typename T>
1768 using B = Base<T>;
1769 using B::B;
1770
1772 size_t GetElementCount() const;
1773
1774 size_t GetDimensionsCount() const;
1775
1780 [[deprecated("use GetShape()")]] void GetDimensions(int64_t* values, size_t values_count) const;
1781
1782 void GetSymbolicDimensions(const char** values, size_t values_count) const;
1783 std::vector<const char*> GetSymbolicDimensions() const;
1784
1785 bool HasShape() const;
1786 std::vector<int64_t> GetShape() const;
1787};
1788
1789} // namespace detail
1790
1792
1798 using Base::Base;
1799
1801 explicit TensorTypeAndShapeInfo(std::nullptr_t) {}
1803 explicit TensorTypeAndShapeInfo(OrtTensorTypeAndShapeInfo* p) : TensorTypeAndShapeInfoImpl{p} {}
1804
1805 // Create a TensorTypeAndShapeInfo object with the specified element type and dimensions
1806 // symbolic_dims are optional, but should be 1:1 with dims.
1807 // The value in symbolic_dims will be used for all entries in dims that are -1.
1809 const std::vector<int64_t>& dims,
1810 const std::vector<std::string>* symbolic_dims = nullptr);
1811
1813};
1814
1815namespace detail {
1816template <typename T>
1818 using B = Base<T>;
1819 using B::B;
1821};
1822
1823} // namespace detail
1824
1826
/// Wrapper around an OrtSequenceTypeInfo pointer, built on detail::SequenceTypeInfoImpl<OrtSequenceTypeInfo>.
1830struct SequenceTypeInfo : detail::SequenceTypeInfoImpl<OrtSequenceTypeInfo> {
1832 using Base::Base;  // inherit the base-class constructors
1833
1834 explicit SequenceTypeInfo(std::nullptr_t) {}  ///< Creates an empty wrapper holding no underlying object.
1835 explicit SequenceTypeInfo(OrtSequenceTypeInfo* p) : SequenceTypeInfoImpl<OrtSequenceTypeInfo>{p} {}  ///< Wraps an existing C API pointer.
1837};
1838
1839namespace detail {
1840template <typename T>
1842 using B = Base<T>;
1843 using B::B;
1845};
1846
1847} // namespace detail
1848
1849// This is always owned by the TypeInfo and can only be obtained from it.
1851
1852namespace detail {
1853template <typename T>
1860
1861} // namespace detail
1862
1864
/// Wrapper around an OrtMapTypeInfo pointer, built on detail::MapTypeInfoImpl<OrtMapTypeInfo>.
1868struct MapTypeInfo : detail::MapTypeInfoImpl<OrtMapTypeInfo> {
1870 using Base::Base;  // inherit the base-class constructors
1871
1872 explicit MapTypeInfo(std::nullptr_t) {}  ///< Creates an empty wrapper holding no underlying object.
1873 explicit MapTypeInfo(OrtMapTypeInfo* p) : MapTypeInfoImpl<OrtMapTypeInfo>{p} {}  ///< Wraps an existing C API pointer.
1874 ConstMapTypeInfo GetConst() const { return ConstMapTypeInfo{this->p_}; }  ///< Builds a ConstMapTypeInfo from the same underlying pointer.
1875};
1876
1877namespace detail {
1878template <typename T>
1890} // namespace detail
1891
1897
/// Wrapper around an OrtTypeInfo pointer, built on detail::TypeInfoImpl<OrtTypeInfo>.
1902struct TypeInfo : detail::TypeInfoImpl<OrtTypeInfo> {
1904 using Base::Base;  // inherit the base-class constructors
1905
1907 explicit TypeInfo(std::nullptr_t) {}  ///< Creates an empty wrapper holding no underlying object.
1908 explicit TypeInfo(OrtTypeInfo* p) : TypeInfoImpl<OrtTypeInfo>{p} {}  ///< Wraps an existing C API pointer.
1909
 // Section compiled only when ORT_MINIMAL_BUILD is not defined.
 // NOTE(review): no declarations are visible inside this section in the listing - check the original header.
1910#if !defined(ORT_MINIMAL_BUILD)
1916#endif // !defined(ORT_MINIMAL_BUILD)
1917
1918 ConstTypeInfo GetConst() const { return ConstTypeInfo{this->p_}; }  ///< Builds a ConstTypeInfo from the same underlying pointer.
1919};
1920
1921namespace detail {
1922// This structure is used to feed sparse tensor values
1923// information for use with FillSparseTensor<Format>() API
1924// if the data type for the sparse tensor values is numeric
1925// use data.p_data, otherwise, use data.str pointer to feed
1926// values. data.str is an array of const char* that are zero terminated.
1927// number of strings in the array must match shape size.
1928// For fully sparse tensors use shape {0} and set p_data/str
1929// to nullptr.
1931 const int64_t* values_shape;
1933 union {
1934 const void* p_data;
1935 const char** str;
1936 } data;
1937};
1938
1939// Provides a way to pass shape in a single
1940// argument
1941struct Shape {
1942 const int64_t* shape;
1944};
1945
1946template <typename T>
1948 using B = Base<T>;
1949 using B::B;
1950
1954 template <typename R>
1955 void GetOpaqueData(const char* domain, const char* type_name, R&) const;
1956
1957 bool IsTensor() const;
1958 bool HasValue() const;
1959
1960 size_t GetCount() const; // If a non tensor, returns 2 for map and N for sequence, where N is the number of elements
1961 Value GetValue(int index, OrtAllocator* allocator) const;
1962
1970
1985 void GetStringTensorContent(void* buffer, size_t buffer_length, size_t* offsets, size_t offsets_count) const;
1986
1993 template <typename R>
1994 const R* GetTensorData() const;
1995
2000 const void* GetTensorRawData() const;
2001
2009
2017
2023
2032 void GetStringTensorElement(size_t buffer_length, size_t element_index, void* buffer) const;
2033
2040 std::string GetStringTensorElement(size_t element_index) const;
2041
2048 size_t GetStringTensorElementLength(size_t element_index) const;
2049
2056 size_t GetTensorSizeInBytes() const;
2057
2058#if !defined(DISABLE_SPARSE_TENSORS)
2066
2073
2082
2092 template <typename R>
2093 const R* GetSparseTensorIndicesData(OrtSparseIndicesFormat indices_format, size_t& num_indices) const;
2094
2099 bool IsSparseTensor() const;
2100
2109 template <typename R>
2110 const R* GetSparseTensorValues() const;
2111
2112#endif
2113};
2114
2115template <typename T>
2118 using B::B;
2119
2125 template <typename R>
2127
2133
2135 // Obtain a reference to an element of data at the location specified
2141 template <typename R>
2142 R& At(const std::vector<int64_t>& location);
2143
2149 void FillStringTensor(const char* const* s, size_t s_len);
2150
2156 void FillStringTensorElement(const char* s, size_t index);
2157
2170 char* GetResizedStringTensorElementBuffer(size_t index, size_t buffer_length);
2171
2172#if !defined(DISABLE_SPARSE_TENSORS)
2181 void UseCooIndices(int64_t* indices_data, size_t indices_num);
2182
2193 void UseCsrIndices(int64_t* inner_data, size_t inner_num, int64_t* outer_data, size_t outer_num);
2194
2203 void UseBlockSparseIndices(const Shape& indices_shape, int32_t* indices_data);
2204
2214 void FillSparseTensorCoo(const OrtMemoryInfo* data_mem_info, const OrtSparseValuesParam& values_param,
2215 const int64_t* indices_data, size_t indices_num);
2216
2228 void FillSparseTensorCsr(const OrtMemoryInfo* data_mem_info,
2229 const OrtSparseValuesParam& values,
2230 const int64_t* inner_indices_data, size_t inner_indices_num,
2231 const int64_t* outer_indices_data, size_t outer_indices_num);
2232
2243 const OrtSparseValuesParam& values,
2244 const Shape& indices_shape,
2245 const int32_t* indices_data);
2246
2247#endif
2248};
2249
2250} // namespace detail
2251
2254
2258struct Value : detail::ValueImpl<OrtValue> {
2260 using Base::Base;
2263
2264 Value(std::nullptr_t) {}
2265 Value(Value&&) = default;
2266 Value& operator=(Value&&) = default;
2267
2268 ConstValue GetConst() const { return ConstValue{this->p_}; }
2269 UnownedValue GetUnowned() const { return UnownedValue{this->p_}; }
2270
2279 template <typename T>
2280 static Value CreateTensor(const OrtMemoryInfo* info, T* p_data, size_t p_data_element_count,
2281 const int64_t* shape, size_t shape_len);
2282
2292 static Value CreateTensor(const OrtMemoryInfo* info, void* p_data, size_t p_data_byte_count,
2293 const int64_t* shape, size_t shape_len,
2295
2305 static Value CreateTensor(OrtAllocator* deleter, void* p_data, size_t p_data_byte_count,
2306 const int64_t* shape, size_t shape_len,
2308
2320 template <typename T>
2321 static Value CreateTensor(OrtAllocator* allocator, const int64_t* shape, size_t shape_len);
2322
2334 static Value CreateTensor(OrtAllocator* allocator, const int64_t* shape, size_t shape_len,
2336
2345 static Value CreateMap(const Value& keys, const Value& values);
2346
2354 static Value CreateSequence(const std::vector<Value>& values);
2355
2364 template <typename T>
2365 static Value CreateOpaque(const char* domain, const char* type_name, const T& value);
2366
2367#if !defined(DISABLE_SPARSE_TENSORS)
2378 template <typename T>
2379 static Value CreateSparseTensor(const OrtMemoryInfo* info, T* p_data, const Shape& dense_shape,
2380 const Shape& values_shape);
2381
2398 static Value CreateSparseTensor(const OrtMemoryInfo* info, void* p_data, const Shape& dense_shape,
2399 const Shape& values_shape, ONNXTensorElementDataType type);
2400
2410 template <typename T>
2411 static Value CreateSparseTensor(OrtAllocator* allocator, const Shape& dense_shape);
2412
2424 static Value CreateSparseTensor(OrtAllocator* allocator, const Shape& dense_shape, ONNXTensorElementDataType type);
2425
2426#endif // !defined(DISABLE_SPARSE_TENSORS)
2427};
2428
2429namespace detail {
2430namespace binding_utils {
// Non-template helpers operating on a raw OrtIoBinding pointer. They are declared outside the
// templated IoBinding wrappers ("brought out of the template") so they do not depend on the
// wrapper's template parameter.
// Each takes the binding and an OrtAllocator pointer and returns the results as a vector.
2431// Bring these out of template
2432std::vector<std::string> GetOutputNamesHelper(const OrtIoBinding* binding, OrtAllocator*);
2433std::vector<Value> GetOutputValuesHelper(const OrtIoBinding* binding, OrtAllocator*);
2434} // namespace binding_utils
2435
2436template <typename T>
2438 using B = Base<T>;
2439 using B::B;
2440
2441 std::vector<std::string> GetOutputNames() const;
2442 std::vector<std::string> GetOutputNames(OrtAllocator*) const;
2443 std::vector<Value> GetOutputValues() const;
2444 std::vector<Value> GetOutputValues(OrtAllocator*) const;
2445};
2446
2447template <typename T>
2450 using B::B;
2451
2452 void BindInput(const char* name, const Value&);
2453 void BindOutput(const char* name, const Value&);
2454 void BindOutput(const char* name, const OrtMemoryInfo*);
2459};
2460
2461} // namespace detail
2462
2465
/// Wrapper around an OrtIoBinding pointer, built on detail::IoBindingImpl<OrtIoBinding>.
2469struct IoBinding : detail::IoBindingImpl<OrtIoBinding> {
2470 explicit IoBinding(std::nullptr_t) {}  ///< Creates an empty wrapper holding no underlying object.
2471 explicit IoBinding(Session& session);  ///< Constructs from a Session (defined out of line).
2472 ConstIoBinding GetConst() const { return ConstIoBinding{this->p_}; }  ///< Builds a ConstIoBinding from the same underlying pointer.
2473 UnownedIoBinding GetUnowned() const { return UnownedIoBinding{this->p_}; }  ///< Builds an UnownedIoBinding from the same underlying pointer.
2474};
2475
/// Wrapper around an OrtArenaCfg pointer (derives from detail::Base<OrtArenaCfg>).
2480struct ArenaCfg : detail::Base<OrtArenaCfg> {
2481 explicit ArenaCfg(std::nullptr_t) {}  ///< Creates an empty wrapper holding no underlying object.
 /// Constructs from four individual settings: max_mem, arena_extend_strategy,
 /// initial_chunk_size_bytes and max_dead_bytes_per_chunk.
 /// NOTE(review): units and special values of these settings are not visible here - see the C API documentation.
2490 ArenaCfg(size_t max_mem, int arena_extend_strategy, int initial_chunk_size_bytes, int max_dead_bytes_per_chunk);
2491
 /// Constructs from a map of setting name to size_t value.
2496 explicit ArenaCfg(const std::unordered_map<std::string, size_t>& arena_config);
2497};
2498
2499//
2500// Custom OPs (only needed to implement custom OPs)
2501//
2502
2503namespace detail {
2504// Need to define a templated ConstOpAttr with const members
2505template <typename T>
2508 using B::B;
2509
2510 // Wraps OrtApi::OpAttr_GetName
2511 std::string GetName() const;
2512 // Wraps OrtApi::OpAttr_GetType
2514
2515 // Wraps OrtApi::ReadAttr for a single value
2516 // This does not support Tensor Attribute
2517 // Call GetTensorAttributeAsOrtValue() instead.
2518 template <typename R>
2519 Status GetValue(R& out) const;
2520
2521 // Wraps OrtApi::ReadAttr for an array of values
2522 template <typename R>
2523 Status GetValueArray(std::vector<R>& out) const;
2524 // Wraps OrtApi::OpAttr_GetTensorAttributeAsOrtValue
2526};
2527} // namespace detail
2528
2530
/// Wrapper around an OrtOpAttr pointer; inherits the read-only accessors of detail::ConstOpAttrImpl<OrtOpAttr>.
2534struct OpAttr : detail::ConstOpAttrImpl<OrtOpAttr> {
2536 using Base::Base;  // inherit the base-class constructors
2537
2538 OpAttr() = default; // Enable storing it in the container for resize()
2539 explicit OpAttr(std::nullptr_t) {}  ///< Creates an empty wrapper holding no underlying object.
 /// Constructs an attribute from its name, a pointer to its data, a length and the attribute type.
 /// NOTE(review): whether `len` counts bytes or elements is not visible here - confirm against the C API.
2540 OpAttr(const char* name, const void* data, int len, OrtOpAttrType type);
2541
2542 ConstOpAttr GetConst() const { return ConstOpAttr{this->p_}; }  ///< Builds a ConstOpAttr from the same underlying pointer.
2543};
2544
/// Logs `message` through `logger` when `message_severity` is at least the logger's severity level.
/// The status returned by LogMessage() is passed to Ort::ThrowOnError().
///
/// Every macro parameter is parenthesized in the expansion so that arbitrary expressions
/// (for example `*logger_ptr` or a conditional expression) can be passed safely.
/// Note that `logger` and `message_severity` are each evaluated more than once.
#define ORT_CXX_LOG(logger, message_severity, message) \
  do { \
    if ((message_severity) >= (logger).GetLoggingSeverityLevel()) { \
      Ort::ThrowOnError((logger).LogMessage((message_severity), ORT_FILE, __LINE__, \
                                            static_cast<const char*>(__FUNCTION__), (message))); \
    } \
  } while (false)
2560
/// Logs `message` through `logger` when `message_severity` is at least the logger's severity level.
/// The status returned by LogMessage() is explicitly discarded, so nothing is thrown by this macro itself.
///
/// Every macro parameter is parenthesized in the expansion so that arbitrary expressions
/// (for example `*logger_ptr` or a conditional expression) can be passed safely.
/// Note that `logger` and `message_severity` are each evaluated more than once.
#define ORT_CXX_LOG_NOEXCEPT(logger, message_severity, message) \
  do { \
    if ((message_severity) >= (logger).GetLoggingSeverityLevel()) { \
      static_cast<void>((logger).LogMessage((message_severity), ORT_FILE, __LINE__, \
                                            static_cast<const char*>(__FUNCTION__), (message))); \
    } \
  } while (false)
2576
/// Logs a printf-style formatted message through `logger` when `message_severity` is at least the
/// logger's severity level. The variadic arguments are the format string followed by its arguments.
/// The status returned by LogFormattedMessage() is passed to Ort::ThrowOnError().
///
/// `logger` and `message_severity` are parenthesized in the expansion so that arbitrary expressions
/// (for example `*logger_ptr` or a conditional expression) can be passed safely.
/// Note that both are evaluated more than once.
#define ORT_CXX_LOGF(logger, message_severity, /*format,*/...) \
  do { \
    if ((message_severity) >= (logger).GetLoggingSeverityLevel()) { \
      Ort::ThrowOnError((logger).LogFormattedMessage((message_severity), ORT_FILE, __LINE__, \
                                                     static_cast<const char*>(__FUNCTION__), __VA_ARGS__)); \
    } \
  } while (false)
2595
/// Logs a printf-style formatted message through `logger` when `message_severity` is at least the
/// logger's severity level. The variadic arguments are the format string followed by its arguments.
/// The status returned by LogFormattedMessage() is explicitly discarded, so nothing is thrown by
/// this macro itself.
///
/// `logger` and `message_severity` are parenthesized in the expansion so that arbitrary expressions
/// (for example `*logger_ptr` or a conditional expression) can be passed safely.
/// Note that both are evaluated more than once.
#define ORT_CXX_LOGF_NOEXCEPT(logger, message_severity, /*format,*/...) \
  do { \
    if ((message_severity) >= (logger).GetLoggingSeverityLevel()) { \
      static_cast<void>((logger).LogFormattedMessage((message_severity), ORT_FILE, __LINE__, \
                                                     static_cast<const char*>(__FUNCTION__), __VA_ARGS__)); \
    } \
  } while (false)
2614
/// Lightweight, copyable handle around a `const OrtLogger*` together with a stored severity level.
/// Both members are value-initialized by default, so a default-constructed Logger holds a null pointer.
2625struct Logger {
2629 Logger() = default;  ///< Default state: null logger pointer, value-initialized severity level.
2630
2634 explicit Logger(std::nullptr_t) {}  ///< Same state as default construction.
2635
 /// Constructs from a C API logger pointer (defined out of line).
 /// NOTE(review): presumably queries and caches the logger's severity level here - confirm in the definition.
2642 explicit Logger(const OrtLogger* logger);
2643
2644 ~Logger() = default;
2645
 // Copy and move are all defaulted: the handle just copies its pointer and cached level.
2646 Logger(const Logger&) = default;
2647 Logger& operator=(const Logger&) = default;
2648
2649 Logger(Logger&& v) noexcept = default;
2650 Logger& operator=(Logger&& v) noexcept = default;
2651
2658
 /// Logs `message` with the given severity and source location (file path, line number, function name).
 /// Declared noexcept: failures are reported through the returned Status.
2671 Status LogMessage(OrtLoggingLevel log_severity_level, const ORTCHAR_T* file_path, int line_number,
2672 const char* func_name, const char* message) const noexcept;
2673
 /// Same as LogMessage(), but takes a format string followed by its arguments.
 /// Declared noexcept: failures are reported through the returned Status.
2688 template <typename... Args>
2689 Status LogFormattedMessage(OrtLoggingLevel log_severity_level, const ORTCHAR_T* file_path, int line_number,
2690 const char* func_name, const char* format, Args&&... args) const noexcept;
2691
2692 private:
2693 const OrtLogger* logger_{};  // underlying C API logger; not owned as far as this declaration shows (no custom destructor)
2694 OrtLoggingLevel cached_severity_level_{};  // severity level stored alongside the pointer
2695};
2696
2705 size_t GetInputCount() const;
2706 size_t GetOutputCount() const;
2707 // If input is optional and is not present, the method returns an empty ConstValue
2708 // which can be compared to nullptr.
2709 ConstValue GetInput(size_t index) const;
2710 // If output is optional and is not present, the method returns an empty UnownedValue
2711 // which can be compared to nullptr.
2712 UnownedValue GetOutput(size_t index, const int64_t* dim_values, size_t dim_count) const;
2713 UnownedValue GetOutput(size_t index, const std::vector<int64_t>& dims) const;
2714 void* GetGPUComputeStream() const;
2716 OrtAllocator* GetAllocator(const OrtMemoryInfo& memory_info) const;
2717 OrtKernelContext* GetOrtKernelContext() const { return ctx_; }
2718 void ParallelFor(void (*fn)(void*, size_t), size_t total, size_t num_batch, void* usr_data) const;
2719
2720 private:
2721 OrtKernelContext* ctx_;
2722};
2723
2724struct KernelInfo;
2725
2726namespace detail {
// Non-template helpers used by KernelInfoImpl::GetAttribute()/GetAttributes().
// Each overload reads the attribute called `name` from the kernel info `p` into the output
// reference passed as the last argument; the overload set determines which types are supported.
2727namespace attr_utils {
// Single-valued attributes: float, int64_t and std::string.
2728void GetAttr(const OrtKernelInfo* p, const char* name, float&);
2729void GetAttr(const OrtKernelInfo* p, const char* name, int64_t&);
2730void GetAttr(const OrtKernelInfo* p, const char* name, std::string&);
// Array-valued attributes: vectors of float and of int64_t.
2731void GetAttrs(const OrtKernelInfo* p, const char* name, std::vector<float>&);
2732void GetAttrs(const OrtKernelInfo* p, const char* name, std::vector<int64_t>&);
2733} // namespace attr_utils
2734
2735template <typename T>
2736struct KernelInfoImpl : Base<T> {
2737 using B = Base<T>;
2738 using B::B;
2739
2740 KernelInfo Copy() const;
2741
2742 template <typename R> // R is only implemented for float, int64_t, and string
2743 R GetAttribute(const char* name) const {
2744 R val;
2745 attr_utils::GetAttr(this->p_, name, val);
2746 return val;
2747 }
2748
2749 template <typename R> // R is only implemented for std::vector<float>, std::vector<int64_t>
2750 std::vector<R> GetAttributes(const char* name) const {
2751 std::vector<R> result;
2752 attr_utils::GetAttrs(this->p_, name, result);
2753 return result;
2754 }
2755
2756 Value GetTensorAttribute(const char* name, OrtAllocator* allocator) const;
2757
2758 size_t GetInputCount() const;
2759 size_t GetOutputCount() const;
2760
2761 std::string GetInputName(size_t index) const;
2762 std::string GetOutputName(size_t index) const;
2763
2764 TypeInfo GetInputTypeInfo(size_t index) const;
2765 TypeInfo GetOutputTypeInfo(size_t index) const;
2766
2767 ConstValue GetTensorConstantInput(size_t index, int* is_constant) const;
2768
2769 std::string GetNodeName() const;
2770 Logger GetLogger() const;
2771};
2772
2773} // namespace detail
2774
2775using ConstKernelInfo = detail::KernelInfoImpl<detail::Unowned<const OrtKernelInfo>>;
2776
/// Wrapper around an OrtKernelInfo pointer, built on detail::KernelInfoImpl<OrtKernelInfo>.
2783struct KernelInfo : detail::KernelInfoImpl<OrtKernelInfo> {
2784 using Base = detail::KernelInfoImpl<OrtKernelInfo>;
2785 using Base::Base;  // inherit the base-class constructors
2786 explicit KernelInfo(std::nullptr_t) {}  ///< Creates an empty wrapper holding no underlying object.
2787 explicit KernelInfo(OrtKernelInfo* info);  ///< Constructs from a C API pointer (defined out of line).
2788 ConstKernelInfo GetConst() const { return ConstKernelInfo{this->p_}; }  ///< Builds a ConstKernelInfo from the same underlying pointer.
2789};
2790
/// Wrapper around an OrtOp pointer (derives from detail::Base<OrtOp>).
/// An Op is produced by Create() and executed with Invoke().
2794struct Op : detail::Base<OrtOp> {
2796 using Base::Base;  // inherit the base-class constructors
2797
2798 explicit Op(std::nullptr_t) {}  ///< Creates an empty wrapper holding no underlying object.
2799
2800 explicit Op(OrtOp*);  ///< Constructs from a C API pointer (defined out of line).
2801
 /// Static factory returning an Op by value.
 /// Takes the kernel info, the operator name, domain and version, `type_constraint_count` parallel
 /// entries of type-constraint names/values, `attr_count` attributes, and the input/output counts.
2802 static Op Create(const OrtKernelInfo* info, const char* op_name, const char* domain,
2803 int version, const char** type_constraint_names,
2804 const ONNXTensorElementDataType* type_constraint_values,
2805 size_t type_constraint_count,
2806 const OpAttr* attr_values,
2807 size_t attr_count,
2808 size_t input_count, size_t output_count);
2809
 /// Invokes the operator with `input_count` inputs and `output_count` outputs given as Value arrays.
2810 void Invoke(const OrtKernelContext* context,
2811 const Value* input_values,
2812 size_t input_count,
2813 Value* output_values,
2814 size_t output_count);
2815
 /// Overload of Invoke() taking arrays of raw OrtValue pointers instead of Value wrappers.
2816 // For easier refactoring
2817 void Invoke(const OrtKernelContext* context,
2818 const OrtValue* const* input_values,
2819 size_t input_count,
2820 OrtValue* const* output_values,
2821 size_t output_count);
2822};
2823
2829 SymbolicInteger(int64_t i) : i_(i), is_int_(true) {};
2830 SymbolicInteger(const char* s) : s_(s), is_int_(false) {};
2833
2836
2837 bool operator==(const SymbolicInteger& dim) const {
2838 if (is_int_ == dim.is_int_) {
2839 if (is_int_) {
2840 return i_ == dim.i_;
2841 } else {
2842 return std::string{s_} == std::string{dim.s_};
2843 }
2844 }
2845 return false;
2846 }
2847
2848 bool IsInt() const { return is_int_; }
2849 int64_t AsInt() const { return i_; }
2850 const char* AsSym() const { return s_; }
2851
2852 static constexpr int INVALID_INT_DIM = -2;
2853
2854 private:
2855 union {
2856 int64_t i_;
2857 const char* s_;
2858 };
2859 bool is_int_;
2860 };
2861
2862 using Shape = std::vector<SymbolicInteger>;
2863
2865
2866 const Shape& GetInputShape(size_t indice) const { return input_shapes_.at(indice); }
2867
2868 size_t GetInputCount() const { return input_shapes_.size(); }
2869
2871
2872 int64_t GetAttrInt(const char* attr_name);
2873
2874 using Ints = std::vector<int64_t>;
2875 Ints GetAttrInts(const char* attr_name);
2876
2877 float GetAttrFloat(const char* attr_name);
2878
2879 using Floats = std::vector<float>;
2880 Floats GetAttrFloats(const char* attr_name);
2881
2882 std::string GetAttrString(const char* attr_name);
2883
2884 using Strings = std::vector<std::string>;
2885 Strings GetAttrStrings(const char* attr_name);
2886
2887 private:
2888 ConstOpAttr GetAttrHdl(const char* attr_name) const;
2889 const OrtApi* ort_api_;
2891 std::vector<Shape> input_shapes_;
2892};
2893
2895
/// Largest custom-op end version: 2^31 - 1 (used as the default for `end_ver_` below).
/// The replacement list is fully parenthesized so the macro keeps its value when used inside a
/// larger expression (e.g. `MAX_CUSTOM_OP_END_VER / 2`).
#define MAX_CUSTOM_OP_END_VER ((1UL << 31) - 1)
2897
2898template <typename TOp, typename TKernel, bool WithStatus = false>
2902 OrtCustomOp::GetName = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetName(); };
2903
2904 OrtCustomOp::GetExecutionProviderType = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetExecutionProviderType(); };
2905
2906 OrtCustomOp::GetInputTypeCount = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetInputTypeCount(); };
2907 OrtCustomOp::GetInputType = [](const OrtCustomOp* this_, size_t index) { return static_cast<const TOp*>(this_)->GetInputType(index); };
2908 OrtCustomOp::GetInputMemoryType = [](const OrtCustomOp* this_, size_t index) { return static_cast<const TOp*>(this_)->GetInputMemoryType(index); };
2909
2910 OrtCustomOp::GetOutputTypeCount = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetOutputTypeCount(); };
2911 OrtCustomOp::GetOutputType = [](const OrtCustomOp* this_, size_t index) { return static_cast<const TOp*>(this_)->GetOutputType(index); };
2912
2913#if defined(_MSC_VER) && !defined(__clang__)
2914#pragma warning(push)
2915#pragma warning(disable : 26409)
2916#endif
2917 OrtCustomOp::KernelDestroy = [](void* op_kernel) { delete static_cast<TKernel*>(op_kernel); };
2918#if defined(_MSC_VER) && !defined(__clang__)
2919#pragma warning(pop)
2920#endif
2921 OrtCustomOp::GetInputCharacteristic = [](const OrtCustomOp* this_, size_t index) { return static_cast<const TOp*>(this_)->GetInputCharacteristic(index); };
2922 OrtCustomOp::GetOutputCharacteristic = [](const OrtCustomOp* this_, size_t index) { return static_cast<const TOp*>(this_)->GetOutputCharacteristic(index); };
2923
2924 OrtCustomOp::GetVariadicInputMinArity = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetVariadicInputMinArity(); };
2925 OrtCustomOp::GetVariadicInputHomogeneity = [](const OrtCustomOp* this_) { return static_cast<int>(static_cast<const TOp*>(this_)->GetVariadicInputHomogeneity()); };
2926 OrtCustomOp::GetVariadicOutputMinArity = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetVariadicOutputMinArity(); };
2927 OrtCustomOp::GetVariadicOutputHomogeneity = [](const OrtCustomOp* this_) { return static_cast<int>(static_cast<const TOp*>(this_)->GetVariadicOutputHomogeneity()); };
2928#ifdef __cpp_if_constexpr
2929 if constexpr (WithStatus) {
2930#else
2931 if (WithStatus) {
2932#endif
2933 OrtCustomOp::CreateKernelV2 = [](const OrtCustomOp* this_, const OrtApi* api, const OrtKernelInfo* info, void** op_kernel) -> OrtStatusPtr {
2934 return static_cast<const TOp*>(this_)->CreateKernelV2(*api, info, op_kernel);
2935 };
2936 OrtCustomOp::KernelComputeV2 = [](void* op_kernel, OrtKernelContext* context) -> OrtStatusPtr {
2937 return static_cast<TKernel*>(op_kernel)->ComputeV2(context);
2938 };
2939 } else {
2942
2943 OrtCustomOp::CreateKernel = [](const OrtCustomOp* this_, const OrtApi* api, const OrtKernelInfo* info) { return static_cast<const TOp*>(this_)->CreateKernel(*api, info); };
2944 OrtCustomOp::KernelCompute = [](void* op_kernel, OrtKernelContext* context) {
2945 static_cast<TKernel*>(op_kernel)->Compute(context);
2946 };
2947 }
2948
2949 SetShapeInferFn<TOp>(0);
2950
2951 OrtCustomOp::GetStartVersion = [](const OrtCustomOp* this_) {
2952 return static_cast<const TOp*>(this_)->start_ver_;
2953 };
2954
2955 OrtCustomOp::GetEndVersion = [](const OrtCustomOp* this_) {
2956 return static_cast<const TOp*>(this_)->end_ver_;
2957 };
2958
2961 OrtCustomOp::GetAliasMap = nullptr;
2963 }
2964
2965 // Default implementation of GetExecutionProviderType that returns nullptr to default to the CPU provider
2966 const char* GetExecutionProviderType() const { return nullptr; }
2967
2968 // Default implementations of GetInputCharacteristic() and GetOutputCharacteristic() below
2969 // (inputs and outputs are required by default)
2971 return OrtCustomOpInputOutputCharacteristic::INPUT_OUTPUT_REQUIRED;
2972 }
2973
2975 return OrtCustomOpInputOutputCharacteristic::INPUT_OUTPUT_REQUIRED;
2976 }
2977
2978 // Default implementation of GetInputMemoryType() that returns OrtMemTypeDefault
2979 OrtMemType GetInputMemoryType(size_t /*index*/) const {
2980 return OrtMemTypeDefault;
2981 }
2982
2983 // Default implementation of GetVariadicInputMinArity() returns 1 to specify that a variadic input
2984 // should expect at least 1 argument.
2986 return 1;
2987 }
2988
2989 // Default implementation of GetVariadicInputHomogeneity() returns true to specify that all arguments
2990 // to a variadic input should be of the same type.
2992 return true;
2993 }
2994
2995 // Default implementation of GetVariadicOutputMinArity() returns 1 to specify that a variadic output
2996 // should produce at least 1 output value.
2998 return 1;
2999 }
3000
3001 // Default implementation of GetVariadicOutputHomogeneity() returns true to specify that all output values
3002 // produced by a variadic output should be of the same type.
3004 return true;
3005 }
3006
3007 // Declare list of session config entries used by this Custom Op.
3008 // Implement this function in order to get configs from CustomOpBase::GetSessionConfigs().
3009 // This default implementation returns an empty vector of config entries.
3010 std::vector<std::string> GetSessionConfigKeys() const {
3011 return std::vector<std::string>{};
3012 }
3013
3014 // Ort::CustomOpBase derived class should provide the following static method with the type/shape inferencing
3015 // implementation if needed:
3016 // static OrtStatusPtr InferOutputShape(Ort::ShapeInferContext& context)
3017 template <typename C>
3018 decltype(&C::InferOutputShape) SetShapeInferFn(decltype(&C::InferOutputShape)) {
3020 ShapeInferContext ctx(&GetApi(), ort_ctx);
3021 return C::InferOutputShape(ctx);
3022 };
3023 return {};
3024 }
3025
3026 template <typename C>
3030
3031 protected:
3032 // Helper function that returns a map of session config entries specified by CustomOpBase::GetSessionConfigKeys.
3033 void GetSessionConfigs(std::unordered_map<std::string, std::string>& out, ConstSessionOptions options) const;
3034
3035 int start_ver_ = 1;
3036 int end_ver_ = MAX_CUSTOM_OP_END_VER;
3037};
3038
3039// Forward declaration to resolve circular dependency
3040// on ConstNode
3042
3043namespace detail {
3044template <typename T>
3046 using B = Base<T>;
3047 using B::B;
3048
3050 std::string GetName() const;
3056 std::vector<ValueInfoConsumerProducerInfo> GetConsumers() const;
3066 bool IsGraphOutput() const;
3070 bool IsFromOuterScope() const;
3071};
3072} // namespace detail
3073
3074// Const object holder that does not own the underlying object
3076
3081 ValueInfo() = default; // Same thing as with nullptr
3082 explicit ValueInfo(std::nullptr_t) {}
3084 explicit ValueInfo(OrtValueInfo* p) : ConstValueInfoImpl<OrtValueInfo>{p} {}
3085
3086#if !defined(ORT_MINIMAL_BUILD)
3087 // Create ValueInfo for a tensor
3088 explicit ValueInfo(const std::string& name, const ConstTypeInfo& type_info);
3089#endif
3090 ConstValueInfo GetConst() const { return ConstValueInfo{this->p_}; }
3091};
3092
3093// Forward declaration
3094struct AttrNameSubgraph;
3095
3096namespace detail {
3097// Forward decl
3098template <typename T>
3099struct ConstGraphImpl;
3100
/// Read-only accessors for a graph node handle. Each method wraps the OrtApi function named in
/// its comment. T selects the underlying handle type stored by Base<T>.
3101template <typename T>
3102struct ConstNodeImpl : Base<T> {
3103 using B = Base<T>;
3104 using B::B;
3105
3106 /// Wraps OrtApi::Node_GetId
3107 size_t GetId() const;
3108 /// Wraps OrtApi::Node_GetName
3109 std::string GetName() const;
3110 /// Wraps OrtApi::Node_GetOperatorType
3111 std::string GetOperatorType() const;
3112 /// Wraps OrtApi::Node_GetDomain
3113 std::string GetDomain() const;
3114 /// Wraps OrtApi::Node_GetSinceVersion
3115 int GetSinceVersion() const;
3116
3117 /// Wraps OrtApi::Node_Inputs
3118 std::vector<ConstValueInfo> GetInputs() const;
3119 /// Wraps OrtApi::Node_Outputs
3120 std::vector<ConstValueInfo> GetOutputs() const;
3121 /// Wraps OrtApi::Node_ImplicitInputs
3122 std::vector<ConstValueInfo> GetImplicitInputs() const;
3123 /// Wraps OrtApi::Node_GetAttributes
3124 std::vector<ConstOpAttr> GetAttributes() const;
3125 /// Wraps OrtApi::Node_GetAttributeByName.
3126 /// Please read the C API documentation for details. The attribute is returned through `attr`
 /// and the outcome through the returned Status.
3127 Status GetAttributeByName(const std::string& name, ConstOpAttr& attr) const;
3128 /// Wraps OrtApi::Node_GetSubgraphs
3129 std::vector<AttrNameSubgraph> GetSubgraphs() const;
3130 // Wraps OrtApi::Node_GetGraph
3131 // ConstGraph is not available yet
 // NOTE(review): the declaration these two comments describe is not visible in this listing.
3133 /// Wraps OrtApi::Node_GetEpName
3134 std::string GetEpName() const;
3135};
3136} // namespace detail
3137
3139
// Wrapper around OrtNode. Adds constructors on top of the read-only
// detail::ConstNodeImpl<OrtNode> interface.
3143struct Node : detail::ConstNodeImpl<OrtNode> {
3144 Node() = default; // Same thing as with nullptr
3145 explicit Node(std::nullptr_t) {}  // No instance is created.
3146 explicit Node(OrtNode* p) : ConstNodeImpl<OrtNode>{p} {}  // Take ownership of a pointer created by C API.
3147
3148#if !defined(ORT_MINIMAL_BUILD)
// Creates a node from operator/domain/node names and input/output names (no attributes).
3149 Node(const std::string& operator_name, const std::string& operator_domain,
3150 const std::string& node_name,
3151 const std::vector<std::string>& input_names,
3152 const std::vector<std::string>& output_names);
3153
// Wraps CreateNode. Node takes ownership of attributes on success, which is why
// `attributes` is taken by non-const reference.
3157 Node(const std::string& operator_name, const std::string& operator_domain,
3158 const std::string& node_name,
3159 const std::vector<std::string>& input_names,
3160 const std::vector<std::string>& output_names,
3161 std::vector<OpAttr>& attributes);
3162
3163 private:
// Static helper that takes the same arguments as the constructor above plus an
// OrtNode*& out-parameter. NOTE(review): presumably shared by both constructors;
// the definition is not visible in this header section, so confirm in the inline header.
3164 static void Init(const std::string& operator_name, const std::string& operator_domain,
3165 const std::string& node_name,
3166 const std::vector<std::string>& input_names,
3167 const std::vector<std::string>& output_names,
3168 std::vector<OpAttr>& attributes,
3169 OrtNode*& node);
3170#endif // !defined(ORT_MINIMAL_BUILD)
3171};
3172
3173// Return struct for some of ValueInfo APIs.
3174// Must be declared after ConstNode is available.
3177 // either producer output or consumer output index
3178 // producer is unsigned only, output can be -1
3179 int64_t index;
3180};
3181
3182// Represents a return value for Graph::GetOperatorSets()
3184 std::string domain;
3185 int64_t version;
3186};
3187
3188namespace detail {
3189template <typename T>
3191 using B = Base<T>;
3192 using B::B;
3193
3194 // <Wraps OrtApi::Graph_GetName
3195 std::string GetName() const;
3196 // <Wraps OrtApi::Graph_GetModelPath
3197 std::basic_string<ORTCHAR_T> GetModelPath() const;
3198 // <Wraps OrtApi::Graph_GetOnnxIRVersion
3199 int64_t GetOnnxIRVersion() const;
3200 // <Wraps OrtApi::Graph_GetOperatorSets
3201 std::vector<OperatorSet> GetOperatorSets() const;
3202 // <Wraps OrtApi::Graph_Inputs
3203 std::vector<ConstValueInfo> GetInputs() const;
3204 // <Wraps OrtApi::Graph_Outputs
3205 std::vector<ConstValueInfo> GetOutputs() const;
3206 // <Wraps OrtApi::Graph_Initializers
3207 std::vector<ConstValueInfo> GetInitializers() const;
3208 // <Wraps OrtApi::Graph_GetNodes
3209 std::vector<ConstNode> GetNodes() const;
3210 // <Wraps OrtApi::Graph_GetParentGraph
3212 // <Wraps OrtApi::Graph_GetGraphView
3213 Graph GetGraphView(const std::vector<ConstNode>& nodes) const;
3214 // <Wraps OrtApi::Graph_GetModelMetadata
3216};
3217
3218template <typename T>
3221 using B::B;
3222
3223#if !defined(ORT_MINIMAL_BUILD)
3224 // <Wraps GetModelEditorApi().SetGraphInputs()
3225 void SetInputs(std::vector<ValueInfo>& inputs);
3226 // <Wraps GetModelEditorApi().SetGraphOutputs()
3227 void SetOutputs(std::vector<ValueInfo>& outputs);
3228 // <Wraps GetModelEditorApi().AddInitializerToGraph()
3229 void AddInitializer(const std::string& name, Value& initializer, bool data_is_external); // Graph takes ownership of Value
3230 // <Wraps GetModelEditorApi().AddNodeToGraph()
3231 void AddNode(Node& node); // Graph takes ownership of Node
3232#endif // !defined(ORT_MINIMAL_BUILD)
3233};
3234} // namespace detail
3235
3237
3238// Return value for Node API
3239// Must be declared after ConstGraph
3244
// Wrapper around OrtGraph, built on detail::GraphImpl<OrtGraph>.
3248struct Graph : detail::GraphImpl<OrtGraph> {
3249 explicit Graph(std::nullptr_t) {}  // No instance is created.
3250 explicit Graph(OrtGraph* p) : GraphImpl<OrtGraph>{p} {}  // Take ownership of a pointer created by C API.
3251#if !defined(ORT_MINIMAL_BUILD)
3252 // Wraps GetModelEditorApi().CreateGraph()
3254#endif
3255};
3256
3257namespace detail {
3258template <typename T>
3261 using B::B;
3262
3263#if !defined(ORT_MINIMAL_BUILD)
3264 // <Wraps GetModelEditorApi().AddGraphToModel()
3265 void AddGraph(Graph& graph);
3266#endif
3267};
3268} // namespace detail
3269
3270// Const object holder that does not own the underlying object
3272
// Wrapper around OrtModel, built on detail::ModelImpl<OrtModel>.
3276struct Model : detail::ModelImpl<OrtModel> {
3277 using DomainOpsetPair = std::pair<std::string, int>;  // (string, int) pair; the name suggests (domain, opset version)
3278
3279 explicit Model(std::nullptr_t) {}  // No instance is created.
3280 explicit Model(OrtModel* p) : ModelImpl<OrtModel>{p} {}  // Take ownership of a pointer created by C API.
3281
3282#if !defined(ORT_MINIMAL_BUILD)
3283 // Wraps GetModelEditorApi().CreateModel()
3284 explicit Model(const std::vector<DomainOpsetPair>& opsets);
3285#endif
3286};
3287} // namespace Ort
3288#include "onnxruntime_cxx_inline.h"
struct OrtMemoryInfo OrtMemoryInfo
Definition onnxruntime_c_api.h:296
struct OrtKernelInfo OrtKernelInfo
Definition onnxruntime_c_api.h:450
struct OrtNode OrtNode
Definition onnxruntime_c_api.h:324
OrtLoggingLevel
Logging severity levels.
Definition onnxruntime_c_api.h:246
OrtMemoryInfoDeviceType
This mimics OrtDevice type constants so they can be returned in the API.
Definition onnxruntime_c_api.h:485
struct OrtShapeInferContext OrtShapeInferContext
Definition onnxruntime_c_api.h:321
void(* OrtLoggingFunction)(void *param, OrtLoggingLevel severity, const char *category, const char *logid, const char *code_location, const char *message)
Definition onnxruntime_c_api.h:414
void(* OrtCustomJoinThreadFn)(OrtCustomThreadHandle ort_custom_thread_handle)
Custom thread join function.
Definition onnxruntime_c_api.h:938
OrtCustomOpInputOutputCharacteristic
Definition onnxruntime_c_api.h:6607
struct OrtTensorRTProviderOptionsV2 OrtTensorRTProviderOptionsV2
Definition onnxruntime_c_api.h:313
struct OrtEpApi OrtEpApi
Definition onnxruntime_c_api.h:882
struct OrtThreadingOptions OrtThreadingOptions
Definition onnxruntime_c_api.h:310
struct OrtSequenceTypeInfo OrtSequenceTypeInfo
Definition onnxruntime_c_api.h:304
struct OrtValueInfo OrtValueInfo
Definition onnxruntime_c_api.h:323
struct OrtDnnlProviderOptions OrtDnnlProviderOptions
Definition onnxruntime_c_api.h:317
OrtSparseIndicesFormat
Definition onnxruntime_c_api.h:235
struct OrtPrepackedWeightsContainer OrtPrepackedWeightsContainer
Definition onnxruntime_c_api.h:312
struct OrtSession OrtSession
Definition onnxruntime_c_api.h:298
OrtCompiledModelCompatibility
The C API.
Definition onnxruntime_c_api.h:961
OrtStatus *(* EpSelectionDelegate)(const OrtEpDevice **ep_devices, size_t num_devices, const OrtKeyValuePairs *model_metadata, const OrtKeyValuePairs *runtime_metadata, const OrtEpDevice **selected, size_t max_selected, size_t *num_selected, void *state)
Delegate to allow providing custom OrtEpDevice selection logic.
Definition onnxruntime_c_api.h:529
struct OrtCustomOpDomain OrtCustomOpDomain
Definition onnxruntime_c_api.h:307
struct OrtIoBinding OrtIoBinding
Definition onnxruntime_c_api.h:297
struct OrtExternalInitializerInfo OrtExternalInitializerInfo
Definition onnxruntime_c_api.h:332
OrtAllocatorType
Definition onnxruntime_c_api.h:456
struct OrtOp OrtOp
Definition onnxruntime_c_api.h:318
struct OrtTypeInfo OrtTypeInfo
Definition onnxruntime_c_api.h:301
struct OrtTensorTypeAndShapeInfo OrtTensorTypeAndShapeInfo
Definition onnxruntime_c_api.h:302
struct OrtCUDAProviderOptionsV2 OrtCUDAProviderOptionsV2
Definition onnxruntime_c_api.h:315
struct OrtKernelContext OrtKernelContext
Definition onnxruntime_c_api.h:452
struct OrtCANNProviderOptions OrtCANNProviderOptions
Definition onnxruntime_c_api.h:316
struct OrtEpDevice OrtEpDevice
Definition onnxruntime_c_api.h:329
void(* RunAsyncCallbackFn)(void *user_data, OrtValue **outputs, size_t num_outputs, OrtStatusPtr status)
Callback function for RunAsync.
Definition onnxruntime_c_api.h:949
OrtHardwareDeviceType
Definition onnxruntime_c_api.h:492
struct OrtModel OrtModel
Definition onnxruntime_c_api.h:326
struct OrtGraph OrtGraph
Definition onnxruntime_c_api.h:325
struct OrtSyncStream OrtSyncStream
Definition onnxruntime_c_api.h:331
struct OrtSessionOptions OrtSessionOptions
Definition onnxruntime_c_api.h:306
OrtDeviceMemoryType
This matches OrtDevice::MemoryType values.
Definition onnxruntime_c_api.h:478
struct OrtValue OrtValue
Definition onnxruntime_c_api.h:299
OrtStatus *(* OrtWriteBufferFunc)(void *state, const void *buffer, size_t buffer_num_bytes)
Function called by ORT to write a buffer to a custom destination (e.g., file, stream,...
Definition onnxruntime_c_api.h:548
GraphOptimizationLevel
Graph optimization level.
Definition onnxruntime_c_api.h:423
struct OrtKeyValuePairs OrtKeyValuePairs
Definition onnxruntime_c_api.h:330
OrtStatus * OrtStatusPtr
Definition onnxruntime_c_api.h:337
OrtMemType
Memory types for allocated memory, execution provider specific types should be extended in each provi...
Definition onnxruntime_c_api.h:466
OrtSparseFormat
Definition onnxruntime_c_api.h:227
ONNXType
Definition onnxruntime_c_api.h:215
struct OrtEnv OrtEnv
Definition onnxruntime_c_api.h:294
OrtErrorCode
Definition onnxruntime_c_api.h:254
struct OrtStatus OrtStatus
Definition onnxruntime_c_api.h:295
OrtStatus *(* OrtGetInitializerLocationFunc)(void *state, const char *initializer_name, const OrtValue *initializer_value, const OrtExternalInitializerInfo *external_info, OrtExternalInitializerInfo **new_external_info)
Function called by ORT to allow user to specify how an initializer should be saved,...
Definition onnxruntime_c_api.h:582
#define ORT_API_VERSION
The API version defined in this header.
Definition onnxruntime_c_api.h:41
struct OrtLogger OrtLogger
Definition onnxruntime_c_api.h:320
struct OrtMapTypeInfo OrtMapTypeInfo
Definition onnxruntime_c_api.h:303
struct OrtArenaCfg OrtArenaCfg
Definition onnxruntime_c_api.h:311
ExecutionMode
Definition onnxruntime_c_api.h:431
OrtOpAttrType
Definition onnxruntime_c_api.h:272
OrtCustomThreadHandle(* OrtCustomCreateThreadFn)(void *ort_custom_thread_creation_options, OrtThreadWorkerFn ort_thread_worker_fn, void *ort_worker_fn_param)
Ort custom thread creation function.
Definition onnxruntime_c_api.h:931
ONNXTensorElementDataType
Definition onnxruntime_c_api.h:184
OrtExecutionProviderDevicePolicy
These are the default EP selection policies used by ORT when doing automatic EP selection.
Definition onnxruntime_c_api.h:500
const OrtApiBase * OrtGetApiBase(void)
The Onnxruntime library's entry point to access the C API.
@ ORT_LOGGING_LEVEL_WARNING
Warning messages.
Definition onnxruntime_c_api.h:249
@ OrtMemTypeDefault
The default allocator for execution provider.
Definition onnxruntime_c_api.h:474
@ ORT_FAIL
Definition onnxruntime_c_api.h:256
@ ONNX_TENSOR_ELEMENT_DATA_TYPE_FLOAT
Definition onnxruntime_c_api.h:186
std::vector< Value > GetOutputValuesHelper(const OrtIoBinding *binding, OrtAllocator *)
std::vector< std::string > GetOutputNamesHelper(const OrtIoBinding *binding, OrtAllocator *)
void OrtRelease(OrtAllocator *ptr)
Definition onnxruntime_cxx_api.h:615
std::string MakeCustomOpConfigEntryKey(const char *custom_op_name, const char *config)
All C++ Onnxruntime APIs are defined inside this namespace.
Definition onnxruntime_cxx_api.h:48
const OrtModelEditorApi & GetModelEditorApi()
This returns a reference to the ORT C Model Editor API. Used if building or augmenting a model at run...
Definition onnxruntime_cxx_api.h:215
std::unique_ptr< char, detail::AllocatedFree > AllocatedStringPtr
unique_ptr typedef used to own strings allocated by OrtAllocators and release them at the end of the ...
Definition onnxruntime_cxx_api.h:788
detail::ConstSessionOptionsImpl< detail::Unowned< const OrtSessionOptions > > ConstSessionOptions
Definition onnxruntime_cxx_api.h:1448
detail::KernelInfoImpl< detail::Unowned< const OrtKernelInfo > > ConstKernelInfo
Definition onnxruntime_cxx_api.h:2775
const OrtApi & GetApi() noexcept
This returns a reference to the ORT C API.
Definition onnxruntime_cxx_api.h:189
const OrtCompileApi & GetCompileApi()
This returns a reference to the ORT C Compile API. Used if compiling a model at runtime.
Definition onnxruntime_cxx_api.h:229
detail::AllocatorImpl< detail::Unowned< OrtAllocator > > UnownedAllocator
Definition onnxruntime_cxx_api.h:1061
OrtCompiledModelCompatibility GetModelCompatibilityForEpDevices(const std::vector< ConstEpDevice > &ep_devices, const char *compatibility_info)
Validate a compiled model's compatibility for one or more EP devices.
detail::SessionOptionsImpl< detail::Unowned< OrtSessionOptions > > UnownedSessionOptions
Definition onnxruntime_cxx_api.h:1447
std::string GetBuildInfoString()
This function returns the onnxruntime build information: including git branch, git commit id,...
const OrtEpApi & GetEpApi()
This returns a reference to the ORT C EP API. Used if authoring a plugin execution provider.
Definition onnxruntime_cxx_api.h:243
std::string GetVersionString()
This function returns the onnxruntime version string.
std::vector< std::string > GetAvailableProviders()
This is a C++ wrapper for OrtApi::GetAvailableProviders() and returns a vector of strings representin...
Ort::Status(*)(Ort::ShapeInferContext &) ShapeInferFn
Definition onnxruntime_cxx_api.h:2894
Status CompileModel(const Env &env, const ModelCompilationOptions &model_compilation_options)
Compiles an input model to generate a model with EPContext nodes that execute EP-specific kernels....
Wrapper around OrtAllocator.
Definition onnxruntime_cxx_api.h:1056
Allocator(const Session &session, const OrtMemoryInfo *)
Allocator(std::nullptr_t)
Convenience to create a class member and then replace with an instance.
Definition onnxruntime_cxx_api.h:1057
Wrapper around OrtAllocator default instance that is owned by Onnxruntime.
Definition onnxruntime_cxx_api.h:1047
AllocatorWithDefaultOptions(std::nullptr_t)
Convenience to create a class member and then replace with an instance.
Definition onnxruntime_cxx_api.h:1048
A structure that represents the configuration of an arena-based allocator.
Definition onnxruntime_cxx_api.h:2480
ArenaCfg(std::nullptr_t)
Create an empty ArenaCfg object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:2481
ArenaCfg(const std::unordered_map< std::string, size_t > &arena_config)
ArenaCfg(size_t max_mem, int arena_extend_strategy, int initial_chunk_size_bytes, int max_dead_bytes_per_chunk)
Definition onnxruntime_cxx_api.h:3240
ConstGraph sub_graph
Definition onnxruntime_cxx_api.h:3242
std::string attr_name
Definition onnxruntime_cxx_api.h:3241
bfloat16 (Brain Floating Point) data type
Definition onnxruntime_cxx_api.h:413
bool operator==(const BFloat16_t &rhs) const noexcept
onnxruntime_float16::BFloat16Impl< BFloat16_t > Base
Definition onnxruntime_cxx_api.h:425
BFloat16_t()=default
static constexpr BFloat16_t FromBits(uint16_t v) noexcept
Explicit conversion to uint16_t representation of bfloat16.
Definition onnxruntime_cxx_api.h:434
bool operator!=(const BFloat16_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:532
BFloat16_t(float v) noexcept
Constructor from float. Float is converted into bfloat16 16-bit representation.
Definition onnxruntime_cxx_api.h:440
float ToFloat() const noexcept
Converts bfloat16 to float.
Definition onnxruntime_cxx_api.h:446
bool operator<(const BFloat16_t &rhs) const noexcept
The CUDAProviderOptions (V2)
Definition onnxruntime_cxx_api.h:859
CUDAProviderOptions()
Wraps OrtApi::CreateCUDAProviderOptions.
CUDAProviderOptions(std::nullptr_t)
Definition onnxruntime_cxx_api.h:860
void UpdateWithValue(const char *key, void *value)
Wrapper around OrtApi::UpdateCUDAProviderOptionsWithValue.
std::string GetCUDAProviderOptionsAsString() const
Wrapper around OrtApi::GetCUDAProviderOptionsAsString.
void Update(const std::unordered_map< std::string, std::string > &options)
Wrapper around OrtApi::UpdateCUDAProviderOptions.
void * GetOptionByName(const char *name) const
Wrapper around OrtApi::GetCUDAProviderOptionsByName.
Definition onnxruntime_cxx_api.h:2899
OrtCustomOpInputOutputCharacteristic GetOutputCharacteristic(size_t) const
Definition onnxruntime_cxx_api.h:2974
OrtCustomOpInputOutputCharacteristic GetInputCharacteristic(size_t) const
Definition onnxruntime_cxx_api.h:2970
OrtMemType GetInputMemoryType(size_t) const
Definition onnxruntime_cxx_api.h:2979
std::vector< std::string > GetSessionConfigKeys() const
Definition onnxruntime_cxx_api.h:3010
bool GetVariadicInputHomogeneity() const
Definition onnxruntime_cxx_api.h:2991
int GetVariadicInputMinArity() const
Definition onnxruntime_cxx_api.h:2985
void SetShapeInferFn(...)
Definition onnxruntime_cxx_api.h:3027
CustomOpBase()
Definition onnxruntime_cxx_api.h:2900
bool GetVariadicOutputHomogeneity() const
Definition onnxruntime_cxx_api.h:3003
int GetVariadicOutputMinArity() const
Definition onnxruntime_cxx_api.h:2997
decltype(&C::InferOutputShape) SetShapeInferFn(decltype(&C::InferOutputShape))
Definition onnxruntime_cxx_api.h:3018
const char * GetExecutionProviderType() const
Definition onnxruntime_cxx_api.h:2966
void GetSessionConfigs(std::unordered_map< std::string, std::string > &out, ConstSessionOptions options) const
Class that represents session configuration entries for one or more custom operators.
Definition onnxruntime_cxx_api.h:1304
~CustomOpConfigs()=default
CustomOpConfigs & AddConfig(const char *custom_op_name, const char *config_key, const char *config_value)
Adds a session configuration entry/value for a specific custom operator.
CustomOpConfigs & operator=(CustomOpConfigs &&o)=default
CustomOpConfigs(CustomOpConfigs &&o)=default
CustomOpConfigs()=default
const std::unordered_map< std::string, std::string > & GetFlattenedConfigs() const
Returns a flattened map of custom operator configuration entries and their values.
CustomOpConfigs(const CustomOpConfigs &)=default
CustomOpConfigs & operator=(const CustomOpConfigs &)=default
Custom Op Domain.
Definition onnxruntime_cxx_api.h:1209
CustomOpDomain(std::nullptr_t)
Create an empty CustomOpDomain object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1213
CustomOpDomain(const char *domain)
Wraps OrtApi::CreateCustomOpDomain.
void Add(const OrtCustomOp *op)
Wraps CustomOpDomain_Add.
The Env (Environment)
Definition onnxruntime_cxx_api.h:1152
Env & EnableTelemetryEvents()
Wraps OrtApi::EnableTelemetryEvents.
Env(OrtEnv *p)
C Interop Helper.
Definition onnxruntime_cxx_api.h:1169
Env & CreateAndRegisterAllocatorV2(const std::string &provider_type, const OrtMemoryInfo *mem_info, const std::unordered_map< std::string, std::string > &options, const OrtArenaCfg *arena_cfg)
Wraps OrtApi::CreateAndRegisterAllocatorV2.
Env & UnregisterExecutionProviderLibrary(const char *registration_name)
Wraps OrtApi::UnregisterExecutionProviderLibrary.
std::vector< ConstEpDevice > GetEpDevices() const
Env & UnregisterAllocator(const OrtMemoryInfo *mem_info)
Wraps OrtApi::UnregisterAllocator.
Env(std::nullptr_t)
Create an empty Env object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1153
Env(OrtLoggingLevel logging_level=ORT_LOGGING_LEVEL_WARNING, const char *logid="")
Wraps OrtApi::CreateEnv.
Env(const OrtThreadingOptions *tp_options, OrtLoggingLevel logging_level=ORT_LOGGING_LEVEL_WARNING, const char *logid="")
Wraps OrtApi::CreateEnvWithGlobalThreadPools.
Env(const OrtThreadingOptions *tp_options, OrtLoggingFunction logging_function, void *logger_param, OrtLoggingLevel logging_level=ORT_LOGGING_LEVEL_WARNING, const char *logid="")
Wraps OrtApi::CreateEnvWithCustomLoggerAndGlobalThreadPools.
Env & RegisterAllocator(OrtAllocator *allocator)
Wraps OrtApi::RegisterAllocator.
UnownedAllocator CreateSharedAllocator(const OrtEpDevice *ep_device, OrtDeviceMemoryType mem_type, OrtAllocatorType allocator_type, const OrtKeyValuePairs *allocator_options)
Wraps OrtApi::CreateSharedAllocator.
Env(OrtLoggingLevel logging_level, const char *logid, OrtLoggingFunction logging_function, void *logger_param)
Wraps OrtApi::CreateEnvWithCustomLogger.
Env & CreateAndRegisterAllocator(const OrtMemoryInfo *mem_info, const OrtArenaCfg *arena_cfg)
Wraps OrtApi::CreateAndRegisterAllocator.
UnownedAllocator GetSharedAllocator(const OrtMemoryInfo *mem_info)
Wraps OrtApi::GetSharedAllocator.
Env & RegisterExecutionProviderLibrary(const char *registration_name, const std::basic_string< char > &path)
Wraps OrtApi::RegisterExecutionProviderLibrary.
Env & UpdateEnvWithCustomLogLevel(OrtLoggingLevel log_severity_level)
Wraps OrtApi::UpdateEnvWithCustomLogLevel.
Status CopyTensors(const std::vector< Value > &src_tensors, const std::vector< Value > &dst_tensors, OrtSyncStream *stream) const
Wraps OrtApi::CopyTensors.
void ReleaseSharedAllocator(const OrtEpDevice *ep_device, OrtDeviceMemoryType mem_type)
Wraps OrtApi::ReleaseSharedAllocator.
Env & DisableTelemetryEvents()
Wraps OrtApi::DisableTelemetryEvents.
Mutable EpDevice that is created by EpApi users.
Definition onnxruntime_cxx_api.h:1128
EpDevice(OrtEpDevice *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:1130
EpDevice(OrtEpFactory &ep_factory, ConstHardwareDevice &hardware_device, ConstKeyValuePairs ep_metadata={}, ConstKeyValuePairs ep_options={})
Wraps OrtEpApi::CreateEpDevice.
EpDevice(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:1129
All C++ methods that can fail will throw an exception of this type.
Definition onnxruntime_cxx_api.h:54
const char * what() const noexcept override
Definition onnxruntime_cxx_api.h:59
Exception(const std::string &string, OrtErrorCode code)
Definition onnxruntime_cxx_api.h:55
OrtErrorCode GetOrtErrorCode() const
Definition onnxruntime_cxx_api.h:58
Exception(std::string &&string, OrtErrorCode code)
Definition onnxruntime_cxx_api.h:56
Wrapper around OrtExternalInitializerInfo.
Definition onnxruntime_cxx_api.h:910
ConstExternalInitializerInfo GetConst() const
Definition onnxruntime_cxx_api.h:918
ExternalInitializerInfo(const char *filepath, int64_t file_offset, size_t byte_size)
Wraps OrtApi::CreateExternalInitializerInfo.
ExternalInitializerInfo(std::nullptr_t)
Definition onnxruntime_cxx_api.h:914
ExternalInitializerInfo(OrtExternalInitializerInfo *p)
Definition onnxruntime_cxx_api.h:915
static Status Create(const char *filepath, int64_t file_offset, size_t byte_size, ExternalInitializerInfo &out)
Wrapper around CreateExternalInitializerInfo that does not throw an exception.
IEEE 754 half-precision floating point data type.
Definition onnxruntime_cxx_api.h:271
Float16_t()=default
Default constructor.
Float16_t(float v) noexcept
Constructor from float. Float is converted into float16 16-bit representation.
Definition onnxruntime_cxx_api.h:299
onnxruntime_float16::Float16Impl< Float16_t > Base
Definition onnxruntime_cxx_api.h:281
float ToFloat() const noexcept
Converts float16 to float.
Definition onnxruntime_cxx_api.h:305
static constexpr Float16_t FromBits(uint16_t v) noexcept
Explicit conversion to uint16_t representation of float16.
Definition onnxruntime_cxx_api.h:293
float8e4m3fn (Float8 Floating Point) data type
Definition onnxruntime_cxx_api.h:543
uint8_t value
Definition onnxruntime_cxx_api.h:544
constexpr Float8E4M3FN_t(uint8_t v) noexcept
Definition onnxruntime_cxx_api.h:546
constexpr bool operator==(const Float8E4M3FN_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:549
constexpr Float8E4M3FN_t() noexcept
Definition onnxruntime_cxx_api.h:545
constexpr bool operator!=(const Float8E4M3FN_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:550
float8e4m3fnuz (Float8 Floating Point) data type
Definition onnxruntime_cxx_api.h:560
constexpr bool operator==(const Float8E4M3FNUZ_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:566
uint8_t value
Definition onnxruntime_cxx_api.h:561
constexpr Float8E4M3FNUZ_t() noexcept
Definition onnxruntime_cxx_api.h:562
constexpr bool operator!=(const Float8E4M3FNUZ_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:567
constexpr Float8E4M3FNUZ_t(uint8_t v) noexcept
Definition onnxruntime_cxx_api.h:563
float8e5m2 (Float8 Floating Point) data type
Definition onnxruntime_cxx_api.h:577
constexpr Float8E5M2_t(uint8_t v) noexcept
Definition onnxruntime_cxx_api.h:580
uint8_t value
Definition onnxruntime_cxx_api.h:578
constexpr bool operator!=(const Float8E5M2_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:584
constexpr Float8E5M2_t() noexcept
Definition onnxruntime_cxx_api.h:579
constexpr bool operator==(const Float8E5M2_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:583
float8e5m2fnuz (Float8 Floating Point) data type
Definition onnxruntime_cxx_api.h:594
constexpr Float8E5M2FNUZ_t() noexcept
Definition onnxruntime_cxx_api.h:596
constexpr Float8E5M2FNUZ_t(uint8_t v) noexcept
Definition onnxruntime_cxx_api.h:597
constexpr bool operator!=(const Float8E5M2FNUZ_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:601
constexpr bool operator==(const Float8E5M2FNUZ_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:600
uint8_t value
Definition onnxruntime_cxx_api.h:595
Wrapper around OrtGraph.
Definition onnxruntime_cxx_api.h:3248
Graph(OrtGraph *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:3250
Graph(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:3249
Wrapper around OrtIoBinding.
Definition onnxruntime_cxx_api.h:2469
UnownedIoBinding GetUnowned() const
Definition onnxruntime_cxx_api.h:2473
ConstIoBinding GetConst() const
Definition onnxruntime_cxx_api.h:2472
IoBinding(Session &session)
IoBinding(std::nullptr_t)
Create an empty object for convenience. Sometimes, we want to initialize members later.
Definition onnxruntime_cxx_api.h:2470
This class wraps a raw pointer OrtKernelContext* that is being passed to the custom kernel Compute() ...
Definition onnxruntime_cxx_api.h:2703
KernelContext(OrtKernelContext *context)
Logger GetLogger() const
ConstValue GetInput(size_t index) const
OrtKernelContext * GetOrtKernelContext() const
Definition onnxruntime_cxx_api.h:2717
void ParallelFor(void(*fn)(void *, size_t), size_t total, size_t num_batch, void *usr_data) const
OrtAllocator * GetAllocator(const OrtMemoryInfo &memory_info) const
void * GetGPUComputeStream() const
size_t GetInputCount() const
size_t GetOutputCount() const
UnownedValue GetOutput(size_t index, const std::vector< int64_t > &dims) const
UnownedValue GetOutput(size_t index, const int64_t *dim_values, size_t dim_count) const
This struct owns the OrtKernelInfo* pointer when a copy is made. For convenient wrapping of OrtKernelIn...
Definition onnxruntime_cxx_api.h:2783
KernelInfo(OrtKernelInfo *info)
Take ownership of the instance.
ConstKernelInfo GetConst() const
Definition onnxruntime_cxx_api.h:2788
detail::KernelInfoImpl< OrtKernelInfo > Base
Definition onnxruntime_cxx_api.h:2784
KernelInfo(std::nullptr_t)
Create an empty instance to initialize later.
Definition onnxruntime_cxx_api.h:2786
Wrapper around OrtKeyValuePairs.
Definition onnxruntime_cxx_api.h:947
KeyValuePairs()
Wraps OrtApi::CreateKeyValuePairs.
void Add(const char *key, const char *value)
Wraps OrtApi::AddKeyValuePair.
KeyValuePairs(const std::unordered_map< std::string, std::string > &kv_pairs)
Wraps OrtApi::CreateKeyValuePairs and OrtApi::AddKeyValuePair.
void Remove(const char *key)
Wraps OrtApi::RemoveKeyValuePair.
KeyValuePairs(std::nullptr_t)
Definition onnxruntime_cxx_api.h:948
ConstKeyValuePairs GetConst() const
Definition onnxruntime_cxx_api.h:964
KeyValuePairs(OrtKeyValuePairs *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:950
This class represents an ONNX Runtime logger that can be used to log information with an associated s...
Definition onnxruntime_cxx_api.h:2625
Logger(Logger &&v) noexcept=default
Logger & operator=(Logger &&v) noexcept=default
Logger & operator=(const Logger &)=default
~Logger()=default
Logger(const Logger &)=default
Logger()=default
Logger(std::nullptr_t)
Definition onnxruntime_cxx_api.h:2634
Logger(const OrtLogger *logger)
OrtLoggingLevel GetLoggingSeverityLevel() const noexcept
LoraAdapter holds a set of Lora Parameters loaded from a single file.
Definition onnxruntime_cxx_api.h:1223
static LoraAdapter CreateLoraAdapter(const std::basic_string< char > &adapter_path, OrtAllocator *allocator)
Wraps OrtApi::CreateLoraAdapter.
LoraAdapter(std::nullptr_t)
Definition onnxruntime_cxx_api.h:1227
static LoraAdapter CreateLoraAdapterFromArray(const void *bytes, size_t num_bytes, OrtAllocator *allocator)
Wraps OrtApi::CreateLoraAdapterFromArray.
Wrapper around OrtMapTypeInfo.
Definition onnxruntime_cxx_api.h:1868
ConstMapTypeInfo GetConst() const
Definition onnxruntime_cxx_api.h:1874
MapTypeInfo(OrtMapTypeInfo *p)
Used for interop with the C API.
Definition onnxruntime_cxx_api.h:1873
MapTypeInfo(std::nullptr_t)
Create an empty MapTypeInfo object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1872
Represents native memory allocation coming from one of the OrtAllocators registered with OnnxRuntime....
Definition onnxruntime_cxx_api.h:1008
MemoryAllocation(MemoryAllocation &&) noexcept
MemoryAllocation & operator=(const MemoryAllocation &)=delete
MemoryAllocation(const MemoryAllocation &)=delete
MemoryAllocation(OrtAllocator *allocator, void *p, size_t size)
size_t size() const
Definition onnxruntime_cxx_api.h:1017
Wrapper around OrtMemoryInfo.
Definition onnxruntime_cxx_api.h:992
MemoryInfo(const char *name, OrtAllocatorType type, int id, OrtMemType mem_type)
MemoryInfo(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:994
MemoryInfo(OrtMemoryInfo *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:995
static MemoryInfo CreateCpu(OrtAllocatorType type, OrtMemType mem_type1)
ConstMemoryInfo GetConst() const
Definition onnxruntime_cxx_api.h:999
MemoryInfo(const char *name, OrtMemoryInfoDeviceType device_type, uint32_t vendor_id, uint32_t device_id, OrtDeviceMemoryType mem_type, size_t alignment, OrtAllocatorType allocator_type)
Wrapper around CreateMemoryInfo_V2.
Options object used when compiling a model.
Definition onnxruntime_cxx_api.h:1465
ModelCompilationOptions & SetOutputModelWriteFunc(OrtWriteBufferFunc write_func, void *state)
ModelCompilationOptions & SetEpContextEmbedMode(bool embed_ep_context_in_model)
Wraps OrtApi::ModelCompilationOptions_SetEpContextEmbedMode.
ModelCompilationOptions & SetInputModelFromBuffer(const void *input_model_data, size_t input_model_data_size)
Wraps OrtApi::ModelCompilationOptions_SetInputModelFromBuffer.
ModelCompilationOptions & SetOutputModelBuffer(OrtAllocator *allocator, void **output_model_buffer_ptr, size_t *output_model_buffer_size_ptr)
Wraps OrtApi::ModelCompilationOptions_SetOutputModelBuffer.
ModelCompilationOptions & SetFlags(uint32_t flags)
Wraps OrtApi::ModelCompilationOptions_SetFlags.
ModelCompilationOptions & SetOutputModelExternalInitializersFile(const char *file_path, size_t initializer_size_threshold)
Wraps OrtApi::ModelCompilationOptions_SetOutputModelExternalInitializersFile.
ModelCompilationOptions(std::nullptr_t)
Create an empty ModelCompilationOptions object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1469
ModelCompilationOptions(const Env &env, ConstSessionOptions session_options)
Wraps OrtApi::CreateModelCompilationOptionsFromSessionOptions.
ModelCompilationOptions & SetOutputModelPath(const char *output_model_path)
Wraps OrtApi::ModelCompilationOptions_SetOutputModelPath.
ModelCompilationOptions & SetInputModelPath(const char *input_model_path)
Wraps OrtApi::ModelCompilationOptions_SetInputModelPath.
ModelCompilationOptions & SetOutputModelGetInitializerLocationFunc(OrtGetInitializerLocationFunc get_initializer_location_func, void *state)
ModelCompilationOptions & SetEpContextBinaryInformation(const char *output_directory, const char *model_name)
Wraps OrtApi::ModelCompilationOptions_SetEpContextBinaryInformation.
ModelCompilationOptions & SetGraphOptimizationLevel(GraphOptimizationLevel graph_optimization_level)
Wraps OrtApi::ModelCompilationOptions_SetGraphOptimizationLevel.
ModelCompilationOptions(const Env &env, const SessionOptions &session_options)
Wraps OrtApi::CreateModelCompilationOptionsFromSessionOptions.
Wrapper around OrtModel.
Definition onnxruntime_cxx_api.h:3276
Model(const std::vector< DomainOpsetPair > &opsets)
Model(OrtModel *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:3280
std::pair< std::string, int > DomainOpsetPair
Definition onnxruntime_cxx_api.h:3277
Model(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:3279
Wrapper around OrtModelMetadata.
Definition onnxruntime_cxx_api.h:1511
AllocatedStringPtr GetDescriptionAllocated(OrtAllocator *allocator) const
Returns a copy of the description.
std::vector< AllocatedStringPtr > GetCustomMetadataMapKeysAllocated(OrtAllocator *allocator) const
Returns a vector of copies of the custom metadata keys.
ModelMetadata(std::nullptr_t)
Create an empty ModelMetadata object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1515
AllocatedStringPtr GetGraphDescriptionAllocated(OrtAllocator *allocator) const
Returns a copy of the graph description.
AllocatedStringPtr GetProducerNameAllocated(OrtAllocator *allocator) const
Returns a copy of the producer name.
AllocatedStringPtr GetGraphNameAllocated(OrtAllocator *allocator) const
Returns a copy of the graph name.
AllocatedStringPtr LookupCustomMetadataMapAllocated(const char *key, OrtAllocator *allocator) const
Looks up a value by a key in the Custom Metadata map.
AllocatedStringPtr GetDomainAllocated(OrtAllocator *allocator) const
Returns a copy of the domain name.
int64_t GetVersion() const
Wraps OrtApi::ModelMetadataGetVersion.
Wrapper around OrtNode.
Definition onnxruntime_cxx_api.h:3143
Node(const std::string &operator_name, const std::string &operator_domain, const std::string &node_name, const std::vector< std::string > &input_names, const std::vector< std::string > &output_names)
Node()=default
Node(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:3145
Node(const std::string &operator_name, const std::string &operator_domain, const std::string &node_name, const std::vector< std::string > &input_names, const std::vector< std::string > &output_names, std::vector< OpAttr > &attributes)
Wraps CreateNode. Node takes ownership of attributes on success and updates the OpAttr in attributes ...
Node(OrtNode *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:3146
This struct provides life time management for custom op attribute.
Definition onnxruntime_cxx_api.h:2534
OpAttr(const char *name, const void *data, int len, OrtOpAttrType type)
OpAttr()=default
OpAttr(std::nullptr_t)
Definition onnxruntime_cxx_api.h:2539
ConstOpAttr GetConst() const
Definition onnxruntime_cxx_api.h:2542
Create and own custom defined operation.
Definition onnxruntime_cxx_api.h:2794
Op(OrtOp *)
Take ownership of the OrtOp.
static Op Create(const OrtKernelInfo *info, const char *op_name, const char *domain, int version, const char **type_constraint_names, const ONNXTensorElementDataType *type_constraint_values, size_t type_constraint_count, const OpAttr *attr_values, size_t attr_count, size_t input_count, size_t output_count)
Op(std::nullptr_t)
Create an empty Operator object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:2798
void Invoke(const OrtKernelContext *context, const OrtValue *const *input_values, size_t input_count, OrtValue *const *output_values, size_t output_count)
void Invoke(const OrtKernelContext *context, const Value *input_values, size_t input_count, Value *output_values, size_t output_count)
Definition onnxruntime_cxx_api.h:3183
std::string domain
Definition onnxruntime_cxx_api.h:3184
int64_t version
Definition onnxruntime_cxx_api.h:3185
The PrepackedWeightsContainer.
Definition onnxruntime_cxx_api.h:878
PrepackedWeightsContainer()
Wraps OrtApi::CreatePrepackedWeightsContainer.
PrepackedWeightsContainer(OrtPrepackedWeightsContainer *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:883
PrepackedWeightsContainer(std::nullptr_t)
Create an empty PrepackedWeightsContainer object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:881
RunOptions.
Definition onnxruntime_cxx_api.h:1251
int GetRunLogSeverityLevel() const
Wraps OrtApi::RunOptionsGetRunLogSeverityLevel.
RunOptions & SetTerminate()
Terminates all currently executing Session::Run calls that were made using this RunOptions instance.
RunOptions & SetRunTag(const char *run_tag)
Wraps OrtApi::RunOptionsSetRunTag.
RunOptions & AddActiveLoraAdapter(const LoraAdapter &adapter)
Add the LoraAdapter to the list of active adapters. The setting does not affect RunWithBinding() call...
RunOptions & UnsetTerminate()
Clears the terminate flag so this RunOptions instance can be used in a new Session::Run call without ...
int GetRunLogVerbosityLevel() const
Wraps OrtApi::RunOptionsGetRunLogVerbosityLevel.
RunOptions(std::nullptr_t)
Create an empty RunOptions object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1252
RunOptions & SetRunLogVerbosityLevel(int)
Wraps OrtApi::RunOptionsSetRunLogVerbosityLevel.
RunOptions & SetRunLogSeverityLevel(int)
Wraps OrtApi::RunOptionsSetRunLogSeverityLevel.
RunOptions & AddConfigEntry(const char *config_key, const char *config_value)
Wraps OrtApi::AddRunConfigEntry.
const char * GetRunTag() const
Wraps OrtApi::RunOptionsGetRunTag.
RunOptions()
Wraps OrtApi::CreateRunOptions.
const char * GetConfigEntry(const char *config_key)
Wraps OrtApi::GetRunConfigEntry.
Wrapper around OrtSequenceTypeInfo.
Definition onnxruntime_cxx_api.h:1830
SequenceTypeInfo(std::nullptr_t)
Create an empty SequenceTypeInfo object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1834
ConstSequenceTypeInfo GetConst() const
Definition onnxruntime_cxx_api.h:1836
SequenceTypeInfo(OrtSequenceTypeInfo *p)
Used for interop with the C API.
Definition onnxruntime_cxx_api.h:1835
Wrapper around OrtSession.
Definition onnxruntime_cxx_api.h:1731
Session(std::nullptr_t)
Create an empty Session object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1733
static Session CreateModelEditorSession(const Env &env, const void *model_data, size_t model_data_length, const SessionOptions &options)
Wraps OrtModelEditorApi::CreateModelEditorSession.
UnownedSession GetUnowned() const
Definition onnxruntime_cxx_api.h:1762
Session(const Env &env, const char *model_path, const SessionOptions &options, OrtPrepackedWeightsContainer *prepacked_weights_container)
Wraps OrtApi::CreateSessionWithPrepackedWeightsContainer.
Session(const Env &env, const void *model_data, size_t model_data_length, const SessionOptions &options, OrtPrepackedWeightsContainer *prepacked_weights_container)
Wraps OrtApi::CreateSessionFromArrayWithPrepackedWeightsContainer.
Session(const Env &env, const Model &model, const SessionOptions &options)
Wraps OrtModelEditorApi::CreateSessionFromModel.
Session(OrtSession *p)
C API Interop.
Definition onnxruntime_cxx_api.h:1734
static Session CreateModelEditorSession(const Env &env, const char *model_path, const SessionOptions &options)
Wraps OrtModelEditorApi::CreateModelEditorSession.
Session(const Env &env, const char *model_path, const SessionOptions &options)
Wraps OrtApi::CreateSession.
ConstSession GetConst() const
Definition onnxruntime_cxx_api.h:1761
Session(const Env &env, const void *model_data, size_t model_data_length, const SessionOptions &options)
Wraps OrtApi::CreateSessionFromArray.
Wrapper around OrtSessionOptions.
Definition onnxruntime_cxx_api.h:1453
SessionOptions(std::nullptr_t)
Create an empty SessionOptions object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1454
UnownedSessionOptions GetUnowned() const
Definition onnxruntime_cxx_api.h:1457
SessionOptions()
Wraps OrtApi::CreateSessionOptions.
ConstSessionOptions GetConst() const
Definition onnxruntime_cxx_api.h:1458
SessionOptions(OrtSessionOptions *p)
Used for interop with the C API.
Definition onnxruntime_cxx_api.h:1456
Definition onnxruntime_cxx_api.h:2828
SymbolicInteger & operator=(const SymbolicInteger &)=default
SymbolicInteger(const SymbolicInteger &)=default
int64_t AsInt() const
Definition onnxruntime_cxx_api.h:2849
int64_t i_
Definition onnxruntime_cxx_api.h:2856
const char * s_
Definition onnxruntime_cxx_api.h:2857
bool operator==(const SymbolicInteger &dim) const
Definition onnxruntime_cxx_api.h:2837
SymbolicInteger & operator=(SymbolicInteger &&)=default
SymbolicInteger(SymbolicInteger &&)=default
const char * AsSym() const
Definition onnxruntime_cxx_api.h:2850
SymbolicInteger(int64_t i)
Definition onnxruntime_cxx_api.h:2829
SymbolicInteger(const char *s)
Definition onnxruntime_cxx_api.h:2830
bool IsInt() const
Definition onnxruntime_cxx_api.h:2848
Provide access to per-node attributes and input shapes, so one could compute and set output shapes.
Definition onnxruntime_cxx_api.h:2827
Ints GetAttrInts(const char *attr_name)
Strings GetAttrStrings(const char *attr_name)
Status SetOutputShape(size_t indice, const Shape &shape, ONNXTensorElementDataType type=ONNX_TENSOR_ELEMENT_DATA_TYPE_FLOAT)
std::vector< SymbolicInteger > Shape
Definition onnxruntime_cxx_api.h:2862
std::vector< float > Floats
Definition onnxruntime_cxx_api.h:2879
std::string GetAttrString(const char *attr_name)
std::vector< int64_t > Ints
Definition onnxruntime_cxx_api.h:2874
ShapeInferContext(const OrtApi *ort_api, OrtShapeInferContext *ctx)
int64_t GetAttrInt(const char *attr_name)
size_t GetInputCount() const
Definition onnxruntime_cxx_api.h:2868
std::vector< std::string > Strings
Definition onnxruntime_cxx_api.h:2884
Floats GetAttrFloats(const char *attr_name)
const Shape & GetInputShape(size_t indice) const
Definition onnxruntime_cxx_api.h:2866
float GetAttrFloat(const char *attr_name)
The Status that holds ownership of OrtStatus received from the C API. Use it to safely destroy OrtStatus* ...
Definition onnxruntime_cxx_api.h:794
OrtErrorCode GetErrorCode() const
Status(const Exception &)
Creates status instance out of exception.
bool IsOK() const noexcept
Returns true if instance represents an OK (non-error) status.
Status(OrtStatus *status) noexcept
Takes ownership of OrtStatus instance returned from the C API.
std::string GetErrorMessage() const
Status()=default
Status(const std::exception &)
Creates status instance out of exception.
Status(const char *message, OrtErrorCode code)
Creates status instance out of null-terminated string message.
Status(std::nullptr_t) noexcept
Create an empty object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:796
Definition onnxruntime_cxx_api.h:1077
SyncStream(OrtSyncStream *p)
Definition onnxruntime_cxx_api.h:1081
SyncStream(std::nullptr_t)
Create an empty SyncStream object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1079
The TensorRTOptions (V2)
Definition onnxruntime_cxx_api.h:840
void Update(const std::unordered_map< std::string, std::string > &options)
Wrapper around OrtApi::UpdateTensorRTProviderOptions.
void UpdateWithValue(const char *key, void *value)
Wrapper around OrtApi::UpdateTensorRTProviderOptionsWithValue.
std::string GetTensorRTProviderOptionsAsString() const
Wrapper around OrtApi::GetTensorRTProviderOptionsAsString.
void * GetOptionByName(const char *name) const
Wrapper around OrtApi::GetTensorRTProviderOptionsByName.
TensorRTProviderOptions(std::nullptr_t)
Definition onnxruntime_cxx_api.h:841
TensorRTProviderOptions()
Wraps OrtApi::CreateTensorRTProviderOptionsV2.
Wrapper around OrtTensorTypeAndShapeInfo.
Definition onnxruntime_cxx_api.h:1796
TensorTypeAndShapeInfo(std::nullptr_t)
Create an empty TensorTypeAndShapeInfo object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1801
ConstTensorTypeAndShapeInfo GetConst() const
Definition onnxruntime_cxx_api.h:1812
TensorTypeAndShapeInfo(OrtTensorTypeAndShapeInfo *p)
Used for interop with the C API.
Definition onnxruntime_cxx_api.h:1803
TensorTypeAndShapeInfo(ONNXTensorElementDataType element_type, const std::vector< int64_t > &dims, const std::vector< std::string > *symbolic_dims=nullptr)
The ThreadingOptions.
Definition onnxruntime_cxx_api.h:810
ThreadingOptions & SetGlobalCustomThreadCreationOptions(void *ort_custom_thread_creation_options)
Wraps OrtApi::SetGlobalCustomThreadCreationOptions.
ThreadingOptions()
Wraps OrtApi::CreateThreadingOptions.
ThreadingOptions & SetGlobalInterOpNumThreads(int inter_op_num_threads)
Wraps OrtApi::SetGlobalInterOpNumThreads.
ThreadingOptions & SetGlobalCustomCreateThreadFn(OrtCustomCreateThreadFn ort_custom_create_thread_fn)
Wraps OrtApi::SetGlobalCustomCreateThreadFn.
ThreadingOptions & SetGlobalCustomJoinThreadFn(OrtCustomJoinThreadFn ort_custom_join_thread_fn)
Wraps OrtApi::SetGlobalCustomJoinThreadFn.
ThreadingOptions & SetGlobalSpinControl(int allow_spinning)
Wraps OrtApi::SetGlobalSpinControl.
ThreadingOptions & SetGlobalDenormalAsZero()
Wraps OrtApi::SetGlobalDenormalAsZero.
ThreadingOptions & SetGlobalIntraOpNumThreads(int intra_op_num_threads)
Wraps OrtApi::SetGlobalIntraOpNumThreads.
Type information that may contain either TensorTypeAndShapeInfo or the information about contained se...
Definition onnxruntime_cxx_api.h:1902
static TypeInfo CreateOptionalTypeInfo(ConstTypeInfo contained_type)
static TypeInfo CreateSequenceTypeInfo(ConstTypeInfo sequence_type)
static TypeInfo CreateTensorInfo(ConstTensorTypeAndShapeInfo tensor_info)
static TypeInfo CreateSparseTensorInfo(ConstTensorTypeAndShapeInfo sparse_tensor_info)
TypeInfo(std::nullptr_t)
Create an empty TypeInfo object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1907
static TypeInfo CreateMapTypeInfo(ONNXTensorElementDataType key_type, ConstTypeInfo value_type)
ConstTypeInfo GetConst() const
Definition onnxruntime_cxx_api.h:1918
TypeInfo(OrtTypeInfo *p)
C API Interop.
Definition onnxruntime_cxx_api.h:1908
Wrapper around OrtValue.
Definition onnxruntime_cxx_api.h:2258
static Value CreateSparseTensor(const OrtMemoryInfo *info, void *p_data, const Shape &dense_shape, const Shape &values_shape, ONNXTensorElementDataType type)
Creates an OrtValue instance containing SparseTensor. This constructs a sparse tensor that makes use ...
static Value CreateSparseTensor(const OrtMemoryInfo *info, T *p_data, const Shape &dense_shape, const Shape &values_shape)
This is a simple forwarding method to the other overload that helps deducing data type enum value fro...
Value & operator=(Value &&)=default
static Value CreateSparseTensor(OrtAllocator *allocator, const Shape &dense_shape, ONNXTensorElementDataType type)
Creates an instance of OrtValue containing sparse tensor. The created instance has no data....
Value(Value &&)=default
Value(std::nullptr_t)
Create an empty Value object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:2264
static Value CreateTensor(const OrtMemoryInfo *info, T *p_data, size_t p_data_element_count, const int64_t *shape, size_t shape_len)
Creates a tensor with a user supplied buffer. Wraps OrtApi::CreateTensorWithDataAsOrtValue.
static Value CreateSparseTensor(OrtAllocator *allocator, const Shape &dense_shape)
This is a simple forwarding method to the below CreateSparseTensor. This helps to specify data type e...
static Value CreateTensor(OrtAllocator *allocator, const int64_t *shape, size_t shape_len, ONNXTensorElementDataType type)
Creates an OrtValue with a tensor using the supplied OrtAllocator. Wraps OrtApi::CreateTensorAsOrtVal...
UnownedValue GetUnowned() const
Definition onnxruntime_cxx_api.h:2269
static Value CreateSequence(const std::vector< Value > &values)
Creates an OrtValue with a Sequence Onnx type representation. The API would ref-count the supplied Or...
static Value CreateMap(const Value &keys, const Value &values)
Creates an OrtValue with a Map Onnx type representation. The API would ref-count the supplied OrtValu...
static Value CreateTensor(const OrtMemoryInfo *info, void *p_data, size_t p_data_byte_count, const int64_t *shape, size_t shape_len, ONNXTensorElementDataType type)
Creates a tensor with a user supplied buffer. Wraps OrtApi::CreateTensorWithDataAsOrtValue.
static Value CreateTensor(OrtAllocator *allocator, const int64_t *shape, size_t shape_len)
Creates an OrtValue with a tensor using a supplied OrtAllocator. Wraps OrtApi::CreateTensorAsOrtValue...
static Value CreateOpaque(const char *domain, const char *type_name, const T &value)
Creates an OrtValue wrapping an Opaque type. This is used for experimental support of non-tensor type...
static Value CreateTensor(OrtAllocator *deleter, void *p_data, size_t p_data_byte_count, const int64_t *shape, size_t shape_len, ONNXTensorElementDataType type)
Creates a tensor with a user supplied buffer. Wraps OrtApi::CreateTensorWithDataAndDeleterAsOrtValue.
ConstValue GetConst() const
Definition onnxruntime_cxx_api.h:2268
Definition onnxruntime_cxx_api.h:3175
int64_t index
Definition onnxruntime_cxx_api.h:3179
ConstNode node
Definition onnxruntime_cxx_api.h:3176
Wrapper around OrtValueInfo.
Definition onnxruntime_cxx_api.h:3080
ConstValueInfo GetConst() const
Definition onnxruntime_cxx_api.h:3090
ValueInfo(std::nullptr_t)
Definition onnxruntime_cxx_api.h:3082
ValueInfo(const std::string &name, const ConstTypeInfo &type_info)
ValueInfo(OrtValueInfo *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:3084
ValueInfo()=default
Definition onnxruntime_cxx_api.h:756
AllocatedFree(OrtAllocator *allocator)
Definition onnxruntime_cxx_api.h:758
OrtAllocator * allocator_
Definition onnxruntime_cxx_api.h:757
void operator()(void *ptr) const
Definition onnxruntime_cxx_api.h:760
Base & operator=(Base &&v) noexcept
Definition onnxruntime_cxx_api.h:742
constexpr contained_type & operator*() const noexcept
Definition onnxruntime_cxx_api.h:749
typename Unowned< T >::Type contained_type
Definition onnxruntime_cxx_api.h:731
Base(Base &&v) noexcept
Definition onnxruntime_cxx_api.h:741
Base(const Base &)=default
constexpr Base(contained_type *p) noexcept
Definition onnxruntime_cxx_api.h:734
Base & operator=(const Base &)=default
Used internally by the C++ API. C++ wrapper types inherit from this. This is a zero cost abstraction ...
Definition onnxruntime_cxx_api.h:684
Base(Base &&v) noexcept
Definition onnxruntime_cxx_api.h:696
constexpr Base()=default
constexpr contained_type & operator*() const noexcept
Definition onnxruntime_cxx_api.h:704
contained_type * release()
Relinquishes ownership of the contained C object pointer. The underlying object is not destroyed.
Definition onnxruntime_cxx_api.h:708
Base(const Base &)=delete
constexpr Base(contained_type *p) noexcept
Definition onnxruntime_cxx_api.h:688
Base & operator=(const Base &)=delete
Base & operator=(Base &&v) noexcept
Definition onnxruntime_cxx_api.h:697
contained_type * p_
Definition onnxruntime_cxx_api.h:715
~Base()
Definition onnxruntime_cxx_api.h:689
T contained_type
Definition onnxruntime_cxx_api.h:685
Definition onnxruntime_cxx_api.h:890
const std::basic_string< char > GetFilePath() const
Definition onnxruntime_cxx_api.h:3190
std::vector< ConstNode > GetNodes() const
std::vector< ConstValueInfo > GetInputs() const
ConstNode GetParentNode() const
int64_t GetOnnxIRVersion() const
std::basic_string< char > GetModelPath() const
Graph GetGraphView(const std::vector< ConstNode > &nodes) const
ModelMetadata GetModelMetadata() const
Wraps OrtApi::Graph_GetModelMetadata.
std::vector< ConstValueInfo > GetInitializers() const
std::string GetName() const
std::vector< ConstValueInfo > GetOutputs() const
std::vector< OperatorSet > GetOperatorSets() const
Definition onnxruntime_cxx_api.h:2437
std::vector< Value > GetOutputValues(OrtAllocator *) const
std::vector< std::string > GetOutputNames(OrtAllocator *) const
std::vector< Value > GetOutputValues() const
std::vector< std::string > GetOutputNames() const
Definition onnxruntime_cxx_api.h:3102
std::vector< ConstValueInfo > GetOutputs() const
std::vector< ConstValueInfo > GetImplicitInputs() const
std::string GetName() const
std::string GetDomain() const
std::vector< AttrNameSubgraph > GetSubgraphs() const
ConstGraphImpl< detail::Unowned< const OrtGraph > > GetGraph() const
std::string GetOperatorType() const
std::vector< ConstOpAttr > GetAttributes() const
std::vector< ConstValueInfo > GetInputs() const
Status GetAttributeByName(const std::string &name, ConstOpAttr &attr) const
std::string GetEpName() const
Definition onnxruntime_cxx_api.h:2506
std::string GetName() const
Status GetValue(R &out) const
Status GetTensorAttributeAsOrtValue(Value &) const
Status GetValueArray(std::vector< R > &out) const
OrtOpAttrType GetType() const
Definition onnxruntime_cxx_api.h:1586
std::vector< std::string > GetOutputNames() const
TypeInfo GetInputTypeInfo(size_t index) const
Wraps OrtApi::SessionGetInputTypeInfo.
size_t GetOutputCount() const
Returns the number of model outputs.
std::vector< ValueInfo > GetOutputs() const
int GetOpset(const std::string &domain) const
Wraps OrtApi::SessionGetOpsetForDomain.
uint64_t GetProfilingStartTimeNs() const
Wraps OrtApi::SessionGetProfilingStartTimeNs.
std::vector< std::string > GetOverridableInitializerNames() const
ModelMetadata GetModelMetadata() const
Wraps OrtApi::SessionGetModelMetadata.
size_t GetInputCount() const
Returns the number of model inputs.
TypeInfo GetOutputTypeInfo(size_t index) const
Wraps OrtApi::SessionGetOutputTypeInfo.
std::vector< std::string > GetInputNames() const
AllocatedStringPtr GetOverridableInitializerNameAllocated(size_t index, OrtAllocator *allocator) const
Returns a copy of the overridable initializer name at the specified index.
std::vector< ConstEpDevice > GetEpDeviceForInputs() const
Wrapper for OrtApi::SessionGetEpDeviceForInputs.
AllocatedStringPtr GetOutputNameAllocated(size_t index, OrtAllocator *allocator) const
Returns a copy of the output name at the specified index.
size_t GetOverridableInitializerCount() const
Returns the number of inputs that have defaults that can be overridden.
std::vector< ConstMemoryInfo > GetMemoryInfoForOutputs() const
Wrapper for OrtApi::SessionGetMemoryInfoForOutputs.
AllocatedStringPtr GetInputNameAllocated(size_t index, OrtAllocator *allocator) const
Returns a copy of the input name at the specified index.
std::vector< ConstMemoryInfo > GetMemoryInfoForInputs() const
Wrapper for OrtApi::SessionGetMemoryInfoForInputs.
std::vector< ValueInfo > GetInputs() const
TypeInfo GetOverridableInitializerTypeInfo(size_t index) const
Wraps OrtApi::SessionGetOverridableInitializerTypeInfo.
Definition onnxruntime_cxx_api.h:1947
void GetStringTensorContent(void *buffer, size_t buffer_length, size_t *offsets, size_t offsets_count) const
The API copies all of the UTF-8 encoded string data contained within a tensor or a sparse tensor into...
void GetStringTensorElement(size_t buffer_length, size_t element_index, void *buffer) const
The API copies UTF-8 encoded bytes for the requested string element contained within a tensor or a sp...
TensorTypeAndShapeInfo GetSparseTensorIndicesTypeShapeInfo(OrtSparseIndicesFormat format) const
The API returns type and shape information for the specified indices. Each supported indices have the...
const void * GetTensorRawData() const
Returns a non-typed pointer to a tensor contained data.
std::string GetStringTensorElement(size_t element_index) const
Returns string tensor UTF-8 encoded string element. Use of this API is recommended over GetStringTens...
size_t GetStringTensorElementLength(size_t element_index) const
The API returns the byte length of a UTF-8 encoded string element contained in either a tensor or a sparse...
size_t GetStringTensorDataLength() const
This API returns a full length of string data contained within either a tensor or a sparse Tensor....
bool IsSparseTensor() const
Returns true if the OrtValue contains a sparse tensor.
TypeInfo GetTypeInfo() const
The API returns type information for data contained in a tensor. For sparse tensors it returns type i...
const R * GetSparseTensorIndicesData(OrtSparseIndicesFormat indices_format, size_t &num_indices) const
The API retrieves a pointer to the internal indices buffer. The API merely performs a convenience dat...
bool IsTensor() const
Returns true if Value is a tensor, false for other types like map/sequence/etc.
ConstMemoryInfo GetTensorMemoryInfo() const
This API returns information about the memory allocation used to hold data.
size_t GetTensorSizeInBytes() const
Returns the total size of the tensor data in bytes. Throws an exception if the OrtValue does not cont...
const R * GetSparseTensorValues() const
The API returns a pointer to an internal buffer of the sparse tensor containing non-zero values....
TensorTypeAndShapeInfo GetTensorTypeAndShapeInfo() const
The API returns type information for data contained in a tensor. For sparse tensors it returns type i...
Value GetValue(int index, OrtAllocator *allocator) const
size_t GetCount() const
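Returns the number of elements held by a non-tensor OrtValue: 2 for a map, N for a sequence of N elements. (Whether an OrtValue contains data or is None is reported by HasValue(), not by GetCount().)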
void GetOpaqueData(const char *domain, const char *type_name, R &) const
Obtains a pointer to user-defined data for experimental purposes.
TensorTypeAndShapeInfo GetSparseTensorValuesTypeAndShapeInfo() const
The API returns type and shape information for stored non-zero values of the sparse tensor....
const R * GetTensorData() const
Returns a const typed pointer to the tensor contained data. No type checking is performed,...
OrtSparseFormat GetSparseFormat() const
The API returns the sparse data format this OrtValue holds in a sparse tensor. If the sparse tensor w...
Definition onnxruntime_cxx_api.h:3045
Status GetInitializer(ConstValue &value) const
A wrapper around OrtApi::ValueInfo_GetInitializerValue.
std::string GetName() const
A wrapper around OrtApi::GetValueInfoName.
bool IsFromOuterScope() const
A wrapper around OrtApi::ValueInfo_IsFromOuterScope.
Status GetExternalInitializerInfo(ExternalInitializerInfo &info) const
A wrapper around OrtApi::ValueInfo_GetExternalInitializerInfo.
bool IsConstantInitializer() const
A wrapper around OrtApi::ValueInfo_IsConstantInitializer.
std::vector< ValueInfoConsumerProducerInfo > GetConsumers() const
A wrapper around OrtApi::ValueInfo_GetValueConsumers.
bool IsGraphOutput() const
A wrapper around OrtApi::ValueInfo_IsGraphOutput.
bool IsRequiredGraphInput() const
A wrapper around OrtApi::ValueInfo_IsRequiredGraphInput.
ConstTypeInfo TypeInfo() const
A wrapper around OrtApi::GetValueInfoTypeInfo.
ValueInfoConsumerProducerInfo GetProducerNode() const
bool IsOptionalGraphInput() const
A wrapper around OrtApi::ValueInfo_IsOptionalGraphInput.
Definition onnxruntime_cxx_api.h:1107
const char * EpName() const
const char * EpVendor() const
ConstKeyValuePairs EpOptions() const
ConstHardwareDevice Device() const
ConstMemoryInfo GetMemoryInfo(OrtDeviceMemoryType memory_type) const
Wraps EpDevice_MemoryInfo.
SyncStream CreateSyncStream(ConstKeyValuePairs stream_options={}) const
ConstKeyValuePairs EpMetadata() const
Definition onnxruntime_cxx_api.h:3219
void SetInputs(std::vector< ValueInfo > &inputs)
void SetOutputs(std::vector< ValueInfo > &outputs)
void AddNode(Node &node)
void AddInitializer(const std::string &name, Value &initializer, bool data_is_external)
Definition onnxruntime_cxx_api.h:1088
OrtHardwareDeviceType Type() const
const char * Vendor() const
ConstKeyValuePairs Metadata() const
Definition onnxruntime_cxx_api.h:2448
void BindOutput(const char *name, const Value &)
void BindInput(const char *name, const Value &)
void BindOutput(const char *name, const OrtMemoryInfo *)
Definition onnxruntime_cxx_api.h:930
void GetKeyValuePairs(std::vector< const char * > &keys, std::vector< const char * > &values) const
std::unordered_map< std::string, std::string > GetKeyValuePairs() const
const char * GetValue(const char *key) const
Definition onnxruntime_cxx_api.h:1854
ONNXTensorElementDataType GetMapKeyType() const
Wraps OrtApi::GetMapKeyType.
TypeInfo GetMapValueType() const
Wraps OrtApi::GetMapValueType.
Definition onnxruntime_cxx_api.h:969
std::string GetAllocatorName() const
Wrapper around MemoryInfoGetName.
int GetDeviceId() const
Wrapper around MemoryInfoGetId.
OrtMemType GetMemoryType() const
Wrapper around MemoryInfoGetMemType.
OrtDeviceMemoryType GetDeviceMemoryType() const
Wrapper around MemoryInfoGetDeviceMemType.
OrtMemoryInfoDeviceType GetDeviceType() const
Wrapper around MemoryInfoGetDeviceType.
OrtAllocatorType GetAllocatorType() const
Wrapper around MemoryInfoGetType.
uint32_t GetVendorId() const
Wrapper around MemoryInfoGetVendorId.
bool operator==(const MemoryInfoImpl< U > &o) const
Definition onnxruntime_cxx_api.h:3259
void AddGraph(Graph &graph)
Definition onnxruntime_cxx_api.h:1841
TypeInfo GetOptionalElementType() const
Wraps OrtApi::CastOptionalTypeToContainedTypeInfo.
Definition onnxruntime_cxx_api.h:1930
const char ** str
Definition onnxruntime_cxx_api.h:1935
const int64_t * values_shape
Definition onnxruntime_cxx_api.h:1931
size_t values_shape_len
Definition onnxruntime_cxx_api.h:1932
const void * p_data
Definition onnxruntime_cxx_api.h:1934
Definition onnxruntime_cxx_api.h:1817
TypeInfo GetSequenceElementType() const
Wraps OrtApi::GetSequenceElementType.
Definition onnxruntime_cxx_api.h:1644
void SetEpDynamicOptions(const char *const *keys, const char *const *values, size_t kv_len)
Set DynamicOptions for EPs (Execution Providers)
AllocatedStringPtr EndProfilingAllocated(OrtAllocator *allocator)
End profiling and return a copy of the profiling file name.
void FinalizeModelEditorSession(const Model &model, const SessionOptions &options, OrtPrepackedWeightsContainer *prepacked_weights_container=nullptr)
void Run(const RunOptions &run_options, const IoBinding &)
Wraps OrtApi::RunWithBinding.
void RunAsync(const RunOptions &run_options, const char *const *input_names, const Value *input_values, size_t input_count, const char *const *output_names, Value *output_values, size_t output_count, RunAsyncCallbackFn callback, void *user_data)
Run the model asynchronously in a thread owned by intra op thread pool.
std::vector< Value > Run(const RunOptions &run_options, const char *const *input_names, const Value *input_values, size_t input_count, const char *const *output_names, size_t output_count)
Run the model returning results in an Ort allocated vector.
void Run(const RunOptions &run_options, const char *const *input_names, const Value *input_values, size_t input_count, const char *const *output_names, Value *output_values, size_t output_count)
Run the model returning results in user provided outputs. Same as Run(const RunOptions&,...
Definition onnxruntime_cxx_api.h:1941
const int64_t * shape
Definition onnxruntime_cxx_api.h:1942
size_t shape_len
Definition onnxruntime_cxx_api.h:1943
Definition onnxruntime_cxx_api.h:1069
void * GetHandle()
Wraps SyncStream_GetHandle.
Definition onnxruntime_cxx_api.h:1767
size_t GetElementCount() const
Wraps OrtApi::GetTensorShapeElementCount.
void GetDimensions(int64_t *values, size_t values_count) const
Wraps OrtApi::GetDimensions.
std::vector< int64_t > GetShape() const
Uses GetDimensionsCount & GetDimensions to return a std::vector of the shape.
std::vector< const char * > GetSymbolicDimensions() const
void GetSymbolicDimensions(const char **values, size_t values_count) const
Wraps OrtApi::GetSymbolicDimensions.
size_t GetDimensionsCount() const
Wraps OrtApi::GetDimensionsCount.
ONNXTensorElementDataType GetElementType() const
Wraps OrtApi::GetTensorElementType.
bool HasShape() const
Wraps OrtApi::TensorTypeAndShape_HasShape.
Definition onnxruntime_cxx_api.h:1879
ONNXType GetONNXType() const
ConstSequenceTypeInfo GetSequenceTypeInfo() const
Wraps OrtApi::CastTypeInfoToSequenceTypeInfo.
ConstMapTypeInfo GetMapTypeInfo() const
Wraps OrtApi::CastTypeInfoToMapTypeInfo.
ConstOptionalTypeInfo GetOptionalTypeInfo() const
Wraps OrtApi::CastTypeInfoToOptionalTypeInfo.
ConstTensorTypeAndShapeInfo GetTensorTypeAndShapeInfo() const
Wraps OrtApi::CastTypeInfoToTensorInfo.
This is a tagging template type. Use it with Base<T> to indicate that the C++ interface object has no...
Definition onnxruntime_cxx_api.h:660
T Type
Definition onnxruntime_cxx_api.h:661
Definition onnxruntime_cxx_api.h:2116
void FillStringTensorElement(const char *s, size_t index)
Set a single string in a string tensor.
R * GetTensorMutableData()
Returns a non-const typed pointer to an OrtValue/Tensor contained buffer. No type checking is performe...
R & At(const std::vector< int64_t > &location)
void UseBlockSparseIndices(const Shape &indices_shape, int32_t *indices_data)
Supplies BlockSparse format specific indices and marks the contained sparse tensor as being a BlockSp...
void FillSparseTensorBlockSparse(const OrtMemoryInfo *data_mem_info, const OrtSparseValuesParam &values, const Shape &indices_shape, const int32_t *indices_data)
The API will allocate memory using the allocator instance supplied to the CreateSparseTensor() API an...
void * GetTensorMutableRawData()
Returns a non-typed non-const pointer to a tensor contained data.
void UseCooIndices(int64_t *indices_data, size_t indices_num)
Supplies COO format specific indices and marks the contained sparse tensor as being a COO format tens...
void FillSparseTensorCoo(const OrtMemoryInfo *data_mem_info, const OrtSparseValuesParam &values_param, const int64_t *indices_data, size_t indices_num)
The API will allocate memory using the allocator instance supplied to the CreateSparseTensor() API an...
void FillStringTensor(const char *const *s, size_t s_len)
Set all strings at once in a string tensor.
void UseCsrIndices(int64_t *inner_data, size_t inner_num, int64_t *outer_data, size_t outer_num)
Supplies CSR format specific indices and marks the contained sparse tensor as being a CSR format tens...
void FillSparseTensorCsr(const OrtMemoryInfo *data_mem_info, const OrtSparseValuesParam &values, const int64_t *inner_indices_data, size_t inner_indices_num, const int64_t *outer_indices_data, size_t outer_indices_num)
The API will allocate memory using the allocator instance supplied to the CreateSparseTensor() API an...
char * GetResizedStringTensorElementBuffer(size_t index, size_t buffer_length)
Allocate if necessary and obtain a pointer to a UTF-8 encoded string element buffer indexed by the fl...
Memory allocation interface.
Definition onnxruntime_c_api.h:346
void(* Free)(struct OrtAllocator *this_, void *p)
Free a block of memory previously allocated with OrtAllocator::Alloc.
Definition onnxruntime_c_api.h:353
const OrtApi *(* GetApi)(uint32_t version)
Get a pointer to the requested version of the OrtApi.
Definition onnxruntime_c_api.h:898
Definition onnxruntime_c_api.h:968
const OrtEpApi *(* GetEpApi)(void)
Get the OrtEpApi instance for implementing an execution provider.
Definition onnxruntime_c_api.h:5437
const OrtCompileApi *(* GetCompileApi)(void)
Get the Compile API instance.
Definition onnxruntime_c_api.h:5169
void(* ReleaseTensorRTProviderOptions)(OrtTensorRTProviderOptionsV2 *input)
Release an OrtTensorRTProviderOptionsV2.
Definition onnxruntime_c_api.h:3224
const OrtModelEditorApi *(* GetModelEditorApi)(void)
Get the Model Editor API instance.
Definition onnxruntime_c_api.h:5111
void(* ReleaseCUDAProviderOptions)(OrtCUDAProviderOptionsV2 *input)
Release an OrtCUDAProviderOptionsV2.
Definition onnxruntime_c_api.h:3727
CUDA Provider Options.
Definition onnxruntime_c_api.h:601
The OrtCompileApi struct provides functions to compile ONNX models.
Definition onnxruntime_c_api.h:7144
Definition onnxruntime_c_api.h:6617
int(* GetVariadicInputHomogeneity)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:6663
OrtCustomOpInputOutputCharacteristic(* GetOutputCharacteristic)(const struct OrtCustomOp *op, size_t index)
Definition onnxruntime_c_api.h:6647
size_t(* GetInputTypeCount)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:6635
int(* GetVariadicOutputMinArity)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:6667
size_t(* GetAliasMap)(int **input_index, int **output_index)
Definition onnxruntime_c_api.h:6700
int(* GetStartVersion)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:6685
void(* ReleaseMayInplace)(int *input_index, int *output_index)
Definition onnxruntime_c_api.h:6697
const char *(* GetName)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:6628
size_t(* GetOutputTypeCount)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:6637
void(* KernelDestroy)(void *op_kernel)
Definition onnxruntime_c_api.h:6643
int(* GetVariadicOutputHomogeneity)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:6672
OrtMemType(* GetInputMemoryType)(const struct OrtCustomOp *op, size_t index)
Definition onnxruntime_c_api.h:6654
void *(* CreateKernel)(const struct OrtCustomOp *op, const OrtApi *api, const OrtKernelInfo *info)
Definition onnxruntime_c_api.h:6624
uint32_t version
Definition onnxruntime_c_api.h:6618
ONNXTensorElementDataType(* GetInputType)(const struct OrtCustomOp *op, size_t index)
Definition onnxruntime_c_api.h:6634
void(* ReleaseAliasMap)(int *input_index, int *output_index)
Definition onnxruntime_c_api.h:6701
OrtCustomOpInputOutputCharacteristic(* GetInputCharacteristic)(const struct OrtCustomOp *op, size_t index)
Definition onnxruntime_c_api.h:6646
const char *(* GetExecutionProviderType)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:6631
ONNXTensorElementDataType(* GetOutputType)(const struct OrtCustomOp *op, size_t index)
Definition onnxruntime_c_api.h:6636
int(* GetVariadicInputMinArity)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:6658
OrtStatusPtr(* InferOutputShapeFn)(const struct OrtCustomOp *op, OrtShapeInferContext *)
Definition onnxruntime_c_api.h:6682
int(* GetEndVersion)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:6686
OrtStatusPtr(* CreateKernelV2)(const struct OrtCustomOp *op, const OrtApi *api, const OrtKernelInfo *info, void **kernel)
Definition onnxruntime_c_api.h:6675
size_t(* GetMayInplace)(int **input_index, int **output_index)
Definition onnxruntime_c_api.h:6693
OrtStatusPtr(* KernelComputeV2)(void *op_kernel, OrtKernelContext *context)
Definition onnxruntime_c_api.h:6680
void(* KernelCompute)(void *op_kernel, OrtKernelContext *context)
Definition onnxruntime_c_api.h:6642
MIGraphX Provider Options.
Definition onnxruntime_c_api.h:805
The OrtModelEditorApi struct provides functions to create or edit an ONNX model.
Definition onnxruntime_c_api.h:6715
OpenVINO Provider Options.
Definition onnxruntime_c_api.h:844
ROCM Provider Options.
Definition onnxruntime_c_api.h:688
TensorRT Provider Options.
Definition onnxruntime_c_api.h:777