ONNX Runtime
Loading...
Searching...
No Matches
onnxruntime_cxx_api.h
1// Copyright (c) Microsoft Corporation. All rights reserved.
2// Licensed under the MIT License.
3
4// Summary: The Ort C++ API is a header only wrapper around the Ort C API.
5//
6// The C++ API simplifies usage by returning values directly instead of error codes, throwing exceptions on errors
7// and automatically releasing resources in the destructors. The primary purpose of C++ API is exception safety so
8// all the resources follow RAII and do not leak memory.
9//
10// Each of the C++ wrapper classes holds only a pointer to the C internal object. Treat them like smart pointers.
11// To create an empty object, pass 'nullptr' to the constructor (for example, Env e{nullptr};). However, you can't use them
12// until you assign an instance that actually holds an underlying object.
13//
14// For Ort objects only move assignment between objects is allowed, there are no copy constructors.
15// Some objects have explicit 'Clone' methods for this purpose.
16//
17// ConstXXXX types are copyable since they do not own the underlying C object, so you can pass them to functions as arguments
18// by value or by reference. ConstXXXX types are restricted to const only interfaces.
19//
20// UnownedXXXX are similar to ConstXXXX but also allow non-const interfaces.
21//
22// The lifetime of the corresponding owning object must eclipse the lifetimes of the ConstXXXX/UnownedXXXX types. They exist so you do not
23// have to fall back to C types and the API with the usual pitfalls. In general, do not use C API from your C++ code.
24
25#pragma once
26#include "onnxruntime_c_api.h"
27#include "onnxruntime_float16.h"
28
29#include <array>
30#include <cstddef>
31#include <cstdio>
32#include <memory>
33#include <stdexcept>
34#include <string>
35#include <type_traits>
36#include <unordered_map>
37#include <utility>
38#include <variant>
39#include <vector>
40
41#ifdef ORT_NO_EXCEPTIONS
42#include <iostream>
43#endif
44
48namespace Ort {
49
54struct Exception : std::exception {
55 Exception(const std::string& string, OrtErrorCode code) : message_{string}, code_{code} {}
56 Exception(std::string&& string, OrtErrorCode code) : message_{std::move(string)}, code_{code} {}
57
58 OrtErrorCode GetOrtErrorCode() const { return code_; }
59 const char* what() const noexcept override { return message_.c_str(); }
60
61 private:
62 std::string message_;
63 OrtErrorCode code_;
64};
65
66#ifdef ORT_NO_EXCEPTIONS
67// The #ifndef is for the very special case where the user of this library wants to define their own way of handling errors.
68// NOTE: This header expects control flow to not continue after calling ORT_CXX_API_THROW
69#ifndef ORT_CXX_API_THROW
70#define ORT_CXX_API_THROW(string, code) \
71 do { \
72 std::cerr << Ort::Exception(string, code) \
73 .what() \
74 << std::endl; \
75 abort(); \
76 } while (false)
77#endif
78#else
79#define ORT_CXX_API_THROW(string, code) \
80 throw Ort::Exception(string, code)
81#endif
82
83#ifdef ORT_API_MANUAL_INIT
84// If the macro ORT_API_MANUAL_INIT is defined, no static initialization
85// will be performed. Instead, users must call InitApi() before using the
86// ORT C++ APIs.
87//
88// InitApi() sets the global API object using the default initialization
89// logic. Users call this to initialize the ORT C++ APIs at a time that
90// makes sense in their program.
91inline void InitApi() noexcept;
92
93// InitApi(const OrtApi*) is used by custom operator libraries that are not
94// linked to onnxruntime. It sets the global API object, which is required
95// by the ORT C++ APIs.
96//
97// Example mycustomop.cc:
98//
99// #define ORT_API_MANUAL_INIT
100// #include <onnxruntime_cxx_api.h>
101// #undef ORT_API_MANUAL_INIT
102//
103// OrtStatus* ORT_API_CALL RegisterCustomOps(OrtSessionOptions* options, const OrtApiBase* api_base) {
104// Ort::InitApi(api_base->GetApi(ORT_API_VERSION));
105// // ...
106// }
107//
108inline void InitApi(const OrtApi* api) noexcept;
109#endif
110
111namespace detail {
112// This is used internally by the C++ API. This class holds the global
113// variable that points to the OrtApi.
114struct Global {
115 static const OrtApi* Api(const OrtApi* newValue = nullptr) noexcept {
116 // This block-level static will be initialized once when this function is
117 // first executed, delaying the call to DefaultInit() until it is first needed.
118 //
119 // When ORT_API_MANUAL_INIT is not defined, DefaultInit() calls
120 // OrtGetApiBase()->GetApi(), which may result in a shared library being
121 // loaded.
122 //
123 // Using a block-level static instead of a class-level static helps
124 // avoid issues with static initialization order and dynamic libraries
125 // loading other dynamic libraries.
126 //
127 // This makes it safe to include the C++ API headers in a shared library
128 // that is delay loaded or delay loads its dependencies.
129 //
130 // This DOES NOT make it safe to _use_ arbitrary ORT C++ APIs when
131 // initializing static members, however.
132 static const OrtApi* api = DefaultInit();
133
134 if (newValue) {
135 api = newValue;
136 }
137
138 return api;
139 }
140
141 private:
142 // Has different definitions based on ORT_API_MANUAL_INIT
143 static const OrtApi* DefaultInit() noexcept;
144
145#ifdef ORT_API_MANUAL_INIT
146 // Public APIs to set the OrtApi* to use.
147 friend void ::Ort::InitApi() noexcept;
148 friend void ::Ort::InitApi(const OrtApi*) noexcept;
149#endif
150};
151} // namespace detail
152
153#ifdef ORT_API_MANUAL_INIT
154
155// See comments on declaration above for usage.
156inline void InitApi(const OrtApi* api) noexcept { detail::Global::Api(api); }
157inline void InitApi() noexcept { InitApi(OrtGetApiBase()->GetApi(ORT_API_VERSION)); }
158
159#ifdef _MSC_VER
160// If you get a linker error about a mismatch here, you are trying to
161// link two compilation units that have different definitions for
162// ORT_API_MANUAL_INIT together. All compilation units must agree on the
163// definition of ORT_API_MANUAL_INIT.
164#pragma detect_mismatch("ORT_API_MANUAL_INIT", "enabled")
165#endif
166
167inline const OrtApi* detail::Global::DefaultInit() noexcept {
168 // When ORT_API_MANUAL_INIT is defined, there's no default init that can
169 // be done.
170 return nullptr;
171}
172
173#else // ORT_API_MANUAL_INIT
174
175#ifdef _MSC_VER
176// If you get a linker error about a mismatch here, you are trying to link
177// two compilation units that have different definitions for
178// ORT_API_MANUAL_INIT together. All compilation units must agree on the
179// definition of ORT_API_MANUAL_INIT.
180#pragma detect_mismatch("ORT_API_MANUAL_INIT", "disabled")
181#endif
182
183inline const OrtApi* detail::Global::DefaultInit() noexcept {
185}
186#endif // ORT_API_MANUAL_INIT
187
189inline const OrtApi& GetApi() noexcept { return *detail::Global::Api(); }
190
195std::string GetVersionString();
196
202std::string GetBuildInfoString();
203
209std::vector<std::string> GetAvailableProviders();
210
216 auto* api = GetApi().GetModelEditorApi();
217 if (api == nullptr) {
218 // minimal build
219 ORT_CXX_API_THROW("Model Editor API is not available in this build", ORT_FAIL);
220 }
221
222 return *api;
223}
224
230 auto* api = GetApi().GetCompileApi();
231 if (api == nullptr) {
232 // minimal build
233 ORT_CXX_API_THROW("Compile API is not available in this build", ORT_FAIL);
234 }
235
236 return *api;
237}
238
244 auto* api = GetApi().GetInteropApi();
245 if (api == nullptr) {
246 // minimal build
247 ORT_CXX_API_THROW("Interop API is not available in this build", ORT_FAIL);
248 }
249
250 return *api;
251}
252
257inline const OrtEpApi& GetEpApi() {
258 auto* api = GetApi().GetEpApi();
259 if (api == nullptr) {
260 // minimal build
261 ORT_CXX_API_THROW("EP API is not available in this build", ORT_FAIL);
262 }
263
264 return *api;
265}
266
// 16-bit floating point wrapper. Derives from onnxruntime_float16::Float16Impl, passing
// itself as the template argument; the base supplies the `val` storage and the
// conversion/classification helpers re-exported below.
// NOTE(review): the base class lives in onnxruntime_float16.h and is not visible here.
285struct Float16_t : onnxruntime_float16::Float16Impl<Float16_t> {
286 private:
 // Stores the given 16-bit pattern unchanged. Private; the public way to build a value
 // from raw bits is FromBits().
292 constexpr explicit Float16_t(uint16_t v) noexcept { val = v; }
293
294 public:
295 using Base = onnxruntime_float16::Float16Impl<Float16_t>;
296
 // Default construction; the initial value is whatever the base class provides.
300 Float16_t() = default;
301
 // Creates a value directly from a raw 16-bit pattern (no numeric conversion).
307 constexpr static Float16_t FromBits(uint16_t v) noexcept { return Float16_t(v); }
308
 // Converts a float through Base::ToUint16Impl and stores the resulting bits.
313 explicit Float16_t(float v) noexcept { val = Base::ToUint16Impl(v); }
314
 // Converts the stored value to float through Base::ToFloatImpl.
319 float ToFloat() const noexcept { return Base::ToFloatImpl(); }
320
 // The using-declarations below expose the corresponding base-class members publicly.
325 using Base::IsNegative;
326
331 using Base::IsNaN;
332
337 using Base::IsFinite;
338
343 using Base::IsPositiveInfinity;
344
349 using Base::IsNegativeInfinity;
350
355 using Base::IsInfinity;
356
361 using Base::IsNaNOrZero;
362
367 using Base::IsNormal;
368
373 using Base::IsSubnormal;
374
379 using Base::Abs;
380
385 using Base::Negate;
386
395 using Base::AreZero;
396
 // Explicit conversion to float; same result as ToFloat().
400 explicit operator float() const noexcept { return ToFloat(); }
401
 // Comparison operators are inherited from the base implementation.
402 using Base::operator==;
403 using Base::operator!=;
404 using Base::operator<;
405};
406
407static_assert(sizeof(Float16_t) == sizeof(uint16_t), "Sizes must match");
408
// 16-bit "bfloat16" wrapper. Derives from onnxruntime_float16::BFloat16Impl, passing
// itself as the template argument; the base supplies the `val` storage and the
// conversion/classification helpers re-exported below.
// NOTE(review): the base class lives in onnxruntime_float16.h and is not visible here.
427struct BFloat16_t : onnxruntime_float16::BFloat16Impl<BFloat16_t> {
428 private:
 // Stores the given 16-bit pattern unchanged. Private; the public way to build a value
 // from raw bits is FromBits().
436 constexpr explicit BFloat16_t(uint16_t v) noexcept { val = v; }
437
438 public:
439 using Base = onnxruntime_float16::BFloat16Impl<BFloat16_t>;
440
 // Default construction; the initial value is whatever the base class provides.
441 BFloat16_t() = default;
442
 // Creates a value directly from a raw 16-bit pattern (no numeric conversion).
448 static constexpr BFloat16_t FromBits(uint16_t v) noexcept { return BFloat16_t(v); }
449
 // Converts a float through Base::ToUint16Impl and stores the resulting bits.
454 explicit BFloat16_t(float v) noexcept { val = Base::ToUint16Impl(v); }
455
 // Converts the stored value to float through Base::ToFloatImpl.
460 float ToFloat() const noexcept { return Base::ToFloatImpl(); }
461
 // The using-declarations below expose the corresponding base-class members publicly.
466 using Base::IsNegative;
467
472 using Base::IsNaN;
473
478 using Base::IsFinite;
479
484 using Base::IsPositiveInfinity;
485
490 using Base::IsNegativeInfinity;
491
496 using Base::IsInfinity;
497
502 using Base::IsNaNOrZero;
503
508 using Base::IsNormal;
509
514 using Base::IsSubnormal;
515
520 using Base::Abs;
521
526 using Base::Negate;
527
536 using Base::AreZero;
537
 // Explicit conversion to float; same result as ToFloat().
541 explicit operator float() const noexcept { return ToFloat(); }
542
543 // We do not have an inherited impl for the below operators
544 // as the internal class implements them a little differently
 // operator== and operator< are only declared here (defined elsewhere);
 // operator!= is the negation of operator==.
545 bool operator==(const BFloat16_t& rhs) const noexcept;
546 bool operator!=(const BFloat16_t& rhs) const noexcept { return !(*this == rhs); }
547 bool operator<(const BFloat16_t& rhs) const noexcept;
548};
549
550static_assert(sizeof(BFloat16_t) == sizeof(uint16_t), "Sizes must match");
551
558 uint8_t value;
559 constexpr Float8E4M3FN_t() noexcept : value(0) {}
560 constexpr Float8E4M3FN_t(uint8_t v) noexcept : value(v) {}
561 constexpr operator uint8_t() const noexcept { return value; }
562 // nan values are treated like any other value for operator ==, !=
563 constexpr bool operator==(const Float8E4M3FN_t& rhs) const noexcept { return value == rhs.value; };
564 constexpr bool operator!=(const Float8E4M3FN_t& rhs) const noexcept { return value != rhs.value; };
565};
566
567static_assert(sizeof(Float8E4M3FN_t) == sizeof(uint8_t), "Sizes must match");
568
575 uint8_t value;
576 constexpr Float8E4M3FNUZ_t() noexcept : value(0) {}
577 constexpr Float8E4M3FNUZ_t(uint8_t v) noexcept : value(v) {}
578 constexpr operator uint8_t() const noexcept { return value; }
579 // nan values are treated like any other value for operator ==, !=
580 constexpr bool operator==(const Float8E4M3FNUZ_t& rhs) const noexcept { return value == rhs.value; };
581 constexpr bool operator!=(const Float8E4M3FNUZ_t& rhs) const noexcept { return value != rhs.value; };
582};
583
584static_assert(sizeof(Float8E4M3FNUZ_t) == sizeof(uint8_t), "Sizes must match");
585
592 uint8_t value;
593 constexpr Float8E5M2_t() noexcept : value(0) {}
594 constexpr Float8E5M2_t(uint8_t v) noexcept : value(v) {}
595 constexpr operator uint8_t() const noexcept { return value; }
596 // nan values are treated like any other value for operator ==, !=
597 constexpr bool operator==(const Float8E5M2_t& rhs) const noexcept { return value == rhs.value; };
598 constexpr bool operator!=(const Float8E5M2_t& rhs) const noexcept { return value != rhs.value; };
599};
600
601static_assert(sizeof(Float8E5M2_t) == sizeof(uint8_t), "Sizes must match");
602
609 uint8_t value;
610 constexpr Float8E5M2FNUZ_t() noexcept : value(0) {}
611 constexpr Float8E5M2FNUZ_t(uint8_t v) noexcept : value(v) {}
612 constexpr operator uint8_t() const noexcept { return value; }
613 // nan values are treated like any other value for operator ==, !=
614 constexpr bool operator==(const Float8E5M2FNUZ_t& rhs) const noexcept { return value == rhs.value; };
615 constexpr bool operator!=(const Float8E5M2FNUZ_t& rhs) const noexcept { return value != rhs.value; };
616};
617
618static_assert(sizeof(Float8E5M2FNUZ_t) == sizeof(uint8_t), "Sizes must match");
619
620namespace detail {
621// This is used internally by the C++ API. This macro is to make it easy to generate overloaded methods for all of the various OrtRelease* functions for every Ort* type
622// This can't be done in the C API since C doesn't have function overloading.
623#define ORT_DEFINE_RELEASE(NAME) \
624 inline void OrtRelease(Ort##NAME* ptr) { GetApi().Release##NAME(ptr); }
625
626#define ORT_DEFINE_RELEASE_FROM_API_STRUCT(NAME, API_GETTER) \
627 inline void OrtRelease(Ort##NAME* ptr) { API_GETTER().Release##NAME(ptr); }
628
629ORT_DEFINE_RELEASE(Allocator);
630ORT_DEFINE_RELEASE(ArenaCfg);
631ORT_DEFINE_RELEASE(CustomOpDomain);
632ORT_DEFINE_RELEASE(Env);
633ORT_DEFINE_RELEASE(ExternalInitializerInfo);
634ORT_DEFINE_RELEASE(Graph);
635ORT_DEFINE_RELEASE(IoBinding);
636ORT_DEFINE_RELEASE(KernelInfo);
637ORT_DEFINE_RELEASE(KeyValuePairs);
638ORT_DEFINE_RELEASE(LoraAdapter);
639ORT_DEFINE_RELEASE(MemoryInfo);
640ORT_DEFINE_RELEASE(MapTypeInfo);
641ORT_DEFINE_RELEASE(Model);
642ORT_DEFINE_RELEASE(ModelMetadata);
643ORT_DEFINE_RELEASE(Node);
644ORT_DEFINE_RELEASE(Op);
645ORT_DEFINE_RELEASE(OpAttr);
646ORT_DEFINE_RELEASE(PrepackedWeightsContainer);
647ORT_DEFINE_RELEASE(RunOptions);
648ORT_DEFINE_RELEASE(Session);
649ORT_DEFINE_RELEASE(SessionOptions);
650ORT_DEFINE_RELEASE(SequenceTypeInfo);
651ORT_DEFINE_RELEASE(Status);
652ORT_DEFINE_RELEASE(SyncStream);
653ORT_DEFINE_RELEASE(TensorTypeAndShapeInfo);
654ORT_DEFINE_RELEASE(ThreadingOptions);
655ORT_DEFINE_RELEASE(TypeInfo);
656ORT_DEFINE_RELEASE(Value);
657ORT_DEFINE_RELEASE(ValueInfo);
658
659ORT_DEFINE_RELEASE_FROM_API_STRUCT(ModelCompilationOptions, GetCompileApi);
660ORT_DEFINE_RELEASE_FROM_API_STRUCT(EpDevice, GetEpApi);
661ORT_DEFINE_RELEASE_FROM_API_STRUCT(KernelDef, GetEpApi);
662ORT_DEFINE_RELEASE_FROM_API_STRUCT(KernelDefBuilder, GetEpApi);
663ORT_DEFINE_RELEASE_FROM_API_STRUCT(KernelRegistry, GetEpApi);
664
665// This is defined explicitly since OrtTensorRTProviderOptionsV2 is not a C API type,
666// but the struct has V2 in its name to indicate that it is the second version of the options.
669
670#undef ORT_DEFINE_RELEASE
671#undef ORT_DEFINE_RELEASE_FROM_API_STRUCT
672
// Tag template used as the argument of detail::Base to select its Base<Unowned<T>>
// specialization; `Type` names the wrapped type T.
676template <typename T>
677struct Unowned {
678 using Type = T;
679};
680
700template <typename T>
701struct Base {
702 using contained_type = T;
703
704 constexpr Base() = default;
705 constexpr explicit Base(contained_type* p) noexcept : p_{p} {}
707 OrtRelease(p_);
708 }
709
710 Base(const Base&) = delete;
711 Base& operator=(const Base&) = delete;
712
713 Base(Base&& v) noexcept : p_{v.p_} { v.p_ = nullptr; }
714 Base& operator=(Base&& v) noexcept {
715 OrtRelease(p_);
716 p_ = v.release();
717 return *this;
718 }
719
720 constexpr operator contained_type*() const noexcept { return p_; }
721 constexpr contained_type& operator*() const noexcept { return *p_; }
722
726 T* p = p_;
727 p_ = nullptr;
728 return p;
729 }
730
731 protected:
733};
734
735// Undefined. For const types use Base<Unowned<const T>>
736template <typename T>
737struct Base<const T>;
738
746template <typename T>
747struct Base<Unowned<T>> {
749
750 constexpr Base() = default;
751 constexpr explicit Base(contained_type* p) noexcept : p_{p} {}
752
753 ~Base() = default;
754
755 Base(const Base&) = default;
756 Base& operator=(const Base&) = default;
757
758 Base(Base&& v) noexcept : p_{v.p_} { v.p_ = nullptr; }
759 Base& operator=(Base&& v) noexcept {
760 p_ = nullptr;
761 std::swap(p_, v.p_);
762 return *this;
763 }
764
765 constexpr operator contained_type*() const noexcept { return p_; }
766 constexpr contained_type& operator*() const noexcept { return *p_; }
767
768 protected:
770};
771
772// Light functor to release memory with OrtAllocator
775 explicit AllocatedFree(OrtAllocator* allocator)
776 : allocator_(allocator) {}
777 void operator()(void* ptr) const {
778 if (ptr) allocator_->Free(allocator_, ptr);
779 }
780};
781
782} // namespace detail
783
784struct AllocatorWithDefaultOptions;
785struct Env;
786struct EpDevice;
787struct ExternalInitializerInfo;
788struct Graph;
789struct Model;
790struct Node;
791struct ModelMetadata;
792struct TypeInfo;
793struct PrepackedWeightsContainer;
794struct Session;
795struct SessionOptions;
796struct SyncStream;
797struct TensorRTProviderOptions;
798struct Value;
799struct ValueInfo;
800
805using AllocatedStringPtr = std::unique_ptr<char, detail::AllocatedFree>;
806
// Owning wrapper for an OrtStatus pointer (built on detail::Base<OrtStatus>).
// Only the nullptr constructor is defined inline; the other members are declared here
// and defined elsewhere.
811struct Status : detail::Base<OrtStatus> {
812 Status() = default; // Same as with std::nullptr_t. But can be used in re-sizable containers and represent success.
 // Creates an empty wrapper that holds no OrtStatus.
813 explicit Status(std::nullptr_t) noexcept {}
 // Wraps an existing OrtStatus pointer — presumably takes ownership; confirm against the definition.
814 explicit Status(OrtStatus* status) noexcept;
 // Build a status from a caught exception — presumably carrying its message; confirm against the definitions.
815 explicit Status(const Exception&);
816 explicit Status(const std::exception&);
 // Build a status from an explicit message and error code.
817 Status(const char* message, OrtErrorCode code);
818 std::string GetErrorMessage() const;
820 bool IsOK() const noexcept;
821};
822
852
// Owning wrapper for an OrtTensorRTProviderOptionsV2 pointer.
// Member functions are declared here and defined elsewhere.
857struct TensorRTProviderOptions : detail::Base<OrtTensorRTProviderOptionsV2> {
 // Creates an empty wrapper holding no options object. Note: unlike most wrappers in this
 // header, this constructor is not marked explicit.
858 TensorRTProviderOptions(std::nullptr_t) {}
 // Applies a set of string key/value options.
862 void Update(const std::unordered_map<std::string, std::string>& options);
 // Sets one option from an untyped pointer — the expected pointee type per key is not visible here.
864 void UpdateWithValue(const char* key, void* value);
865
 // Looks up one option by name and returns it as an untyped pointer.
867 void* GetOptionByName(const char* name) const;
870};
871
// Owning wrapper for an OrtCUDAProviderOptionsV2 pointer.
// Member functions are declared here and defined elsewhere.
876struct CUDAProviderOptions : detail::Base<OrtCUDAProviderOptionsV2> {
 // Creates an empty wrapper holding no options object. Note: unlike most wrappers in this
 // header, this constructor is not marked explicit.
877 CUDAProviderOptions(std::nullptr_t) {}
 // Applies a set of string key/value options.
881 void Update(const std::unordered_map<std::string, std::string>& options);
 // Sets one option from an untyped pointer — the expected pointee type per key is not visible here.
885 void UpdateWithValue(const char* key, void* value);
 // Looks up one option by name and returns it as an untyped pointer.
887 void* GetOptionByName(const char* name) const;
888};
889
904
905namespace detail {
906template <typename T>
908 using B = Base<T>;
909 using B::B;
910
911 // Wraps OrtApi::ExternalInitializerInfo_GetFilePath
912 const std::basic_string<ORTCHAR_T> GetFilePath() const;
913 // Wraps OrtApi::ExternalInitializerInfo_GetFileOffset
914 int64_t GetFileOffset() const;
915 // Wraps OrtApi::ExternalInitializerInfo_GetByteSize
916 size_t GetByteSize() const;
917};
918} // namespace detail
919
920// Const object holder that does not own the underlying object
923
929 using Base::Base;
930
931 explicit ExternalInitializerInfo(std::nullptr_t) {}
933 : detail::ConstExternalInitializerInfoImpl<OrtExternalInitializerInfo>{p} {}
934
936
938 ExternalInitializerInfo(const ORTCHAR_T* filepath, int64_t file_offset, size_t byte_size);
939
941 static Status Create(const ORTCHAR_T* filepath, int64_t file_offset, size_t byte_size,
942 /*out*/ ExternalInitializerInfo& out);
943};
944
945namespace detail {
946template <typename T>
949 using B::B;
950
951 const char* GetValue(const char* key) const;
952
953 // get the pairs in unordered_map. needs to copy to std::string so the hash works as expected
954 std::unordered_map<std::string, std::string> GetKeyValuePairs() const;
955 // get the pairs in two vectors. entries will be 1:1 between keys and values. avoids copying to std::string
956 void GetKeyValuePairs(std::vector<const char*>& keys, std::vector<const char*>& values) const;
957};
958} // namespace detail
959
960// Const object holder that does not own the underlying object
962
// Owning wrapper for an OrtKeyValuePairs pointer; adds the mutating operations on top of
// the read-only interface inherited from detail::KeyValuePairsImpl.
964struct KeyValuePairs : detail::KeyValuePairsImpl<OrtKeyValuePairs> {
 // Creates an empty wrapper holding no underlying object.
965 explicit KeyValuePairs(std::nullptr_t) {}
 // Wraps an existing OrtKeyValuePairs pointer.
967 explicit KeyValuePairs(OrtKeyValuePairs* p) : KeyValuePairsImpl<OrtKeyValuePairs>{p} {}
968
 // Declared here, defined elsewhere — presumably creates a new, empty OrtKeyValuePairs.
970 explicit KeyValuePairs();
971
 // Declared here, defined elsewhere — presumably creates an instance populated from kv_pairs.
973 explicit KeyValuePairs(const std::unordered_map<std::string, std::string>& kv_pairs);
974
976 void Add(const char* key, const char* value);
977
979 void Remove(const char* key);
980
 // Returns a non-owning const view of the same underlying object; this object must outlive it.
981 ConstKeyValuePairs GetConst() const { return ConstKeyValuePairs{this->p_}; }
982};
983
984namespace detail {
// Query interface shared by the MemoryInfo wrappers; T is the template argument forwarded
// to detail::Base. All members are declared here and defined elsewhere.
985template <typename T>
986struct MemoryInfoImpl : Base<T> {
987 using B = Base<T>;
 // Inherit the Base<T> constructors.
988 using B::B;
989
990 std::string GetAllocatorName() const;
992 int GetDeviceId() const;
996 uint32_t GetVendorId() const;
997
 // Comparison against any other MemoryInfoImpl instantiation, regardless of its template argument.
998 template <typename U>
999 bool operator==(const MemoryInfoImpl<U>& o) const;
1000};
1001} // namespace detail
1002
1003// Const object holder that does not own the underlying object
1005
// Owning wrapper for an OrtMemoryInfo pointer.
1009struct MemoryInfo : detail::MemoryInfoImpl<OrtMemoryInfo> {
 // Creates an empty wrapper holding no underlying object.
1011 explicit MemoryInfo(std::nullptr_t) {}
 // Wraps an existing OrtMemoryInfo pointer.
1012 explicit MemoryInfo(OrtMemoryInfo* p) : MemoryInfoImpl<OrtMemoryInfo>{p} {}
 // The two constructors below are declared here and defined elsewhere — presumably they
 // create a new OrtMemoryInfo from the given description.
1013 MemoryInfo(const char* name, OrtAllocatorType type, int id, OrtMemType mem_type);
1014 MemoryInfo(const char* name, OrtMemoryInfoDeviceType device_type, uint32_t vendor_id, uint32_t device_id,
1015 OrtDeviceMemoryType mem_type, size_t alignment, OrtAllocatorType allocator_type);
 // Returns a non-owning const view of the same underlying object; this object must outlive it.
1016 ConstMemoryInfo GetConst() const { return ConstMemoryInfo{this->p_}; }
1017};
1018
1026 MemoryAllocation(OrtAllocator* allocator, void* p, size_t size);
1031 MemoryAllocation& operator=(MemoryAllocation&&) noexcept;
1032
1033 void* get() { return p_; }
1034 size_t size() const { return size_; }
1035
1036 private:
1037 OrtAllocator* allocator_;
1038 void* p_;
1039 size_t size_;
1040};
1041
1042namespace detail {
// Allocator operations shared by the owning and non-owning allocator wrappers; T is the
// template argument forwarded to detail::Base. All members are declared here and defined elsewhere.
1043template <typename T>
1044struct AllocatorImpl : Base<T> {
1045 using B = Base<T>;
 // Inherit the Base<T> constructors.
1046 using B::B;
1047
 // Raw allocation of `size` bytes; pair with Free().
1048 void* Alloc(size_t size);
 // Allocation returned as a MemoryAllocation object instead of a raw pointer.
1049 MemoryAllocation GetAllocation(size_t size);
1050 void Free(void* p);
1051 ConstMemoryInfo GetInfo() const;
1052
1057 KeyValuePairs GetStats() const;
1058};
1059} // namespace detail
1060
// Allocator wrapper built on the non-owning base (detail::Unowned<OrtAllocator>), so the
// wrapped OrtAllocator is not released when this object is destroyed.
1064struct AllocatorWithDefaultOptions : detail::AllocatorImpl<detail::Unowned<OrtAllocator>> {
 // Creates an empty wrapper holding no allocator.
1065 explicit AllocatorWithDefaultOptions(std::nullptr_t) {}
1067};
1068
// Owning wrapper for an OrtAllocator pointer.
1073struct Allocator : detail::AllocatorImpl<OrtAllocator> {
 // Creates an empty wrapper holding no allocator.
1074 explicit Allocator(std::nullptr_t) {}
 // Declared here, defined elsewhere — presumably creates an allocator for the given
 // session and memory info.
1075 Allocator(const Session& session, const OrtMemoryInfo*);
1076
 // Wraps an existing OrtAllocator pointer.
1078 explicit Allocator(OrtAllocator* p) : AllocatorImpl<OrtAllocator>{p} {}
1079};
1080
1081using UnownedAllocator = detail::AllocatorImpl<detail::Unowned<OrtAllocator>>;
1082
1087namespace detail {
1088template <typename T>
1090 using B = Base<T>;
1091 using B::B;
1092 // For some reason this is not a const method on the stream
1093 void* GetHandle();
1094};
1095} // namespace detail
1096
// Owning wrapper for an OrtSyncStream pointer.
1097struct SyncStream : detail::SyncStreamImpl<OrtSyncStream> {
 // Creates an empty wrapper holding no stream.
1099 explicit SyncStream(std::nullptr_t) {}
 // Wraps an existing OrtSyncStream pointer.
1101 explicit SyncStream(OrtSyncStream* p) : SyncStreamImpl<OrtSyncStream>{p} {}
1102};
1103
1105
1106namespace detail {
1107template <typename T>
1110 using B::B;
1111
1113 uint32_t VendorId() const;
1114 uint32_t DeviceId() const;
1115 const char* Vendor() const;
1117};
1118} // namespace detail
1119
1124
1125namespace detail {
1126template <typename T>
1129 using B::B;
1130
1131 const char* EpName() const;
1132 const char* EpVendor() const;
1138};
1139} // namespace detail
1140
1145
// Owning wrapper for an OrtEpDevice pointer.
1148struct EpDevice : detail::EpDeviceImpl<OrtEpDevice> {
 // Creates an empty wrapper holding no device.
1149 explicit EpDevice(std::nullptr_t) {}
 // Wraps an existing OrtEpDevice pointer.
1150 explicit EpDevice(OrtEpDevice* p) : EpDeviceImpl<OrtEpDevice>{p} {}
1151
 // Declared here, defined elsewhere — presumably creates a new OrtEpDevice for the given
 // factory and hardware device. Metadata and options default to empty holders.
1153 EpDevice(OrtEpFactory& ep_factory, ConstHardwareDevice& hardware_device,
1154 ConstKeyValuePairs ep_metadata = {}, ConstKeyValuePairs ep_options = {});
1155};
1156
1164 const std::vector<ConstEpDevice>& ep_devices,
1165 const char* compatibility_info);
1166
1182AllocatedStringPtr GetCompatibilityInfoFromModelAllocated(const ORTCHAR_T* model_path, const char* ep_type,
1183 OrtAllocator* allocator);
1184
1197AllocatedStringPtr GetCompatibilityInfoFromModelBytesAllocated(const void* model_data, size_t model_data_length,
1198 const char* ep_type, OrtAllocator* allocator);
1199
1200namespace detail {
1201template <typename T>
1204 using B::B;
1205
1206 std::string GetName() const;
1207 std::string GetDomain() const;
1208 std::string GetOperatorType() const;
1209};
1210} // namespace detail
1211
1216
1217namespace detail {
1218template <typename T>
1221 using B::B;
1222
1223 std::string GetEpName() const;
1224 std::vector<ConstEpAssignedNode> GetNodes() const;
1225};
1226} // namespace detail
1227
1232
1238struct Env : detail::Base<OrtEnv> {
1239 explicit Env(std::nullptr_t) {}
1240
1242 Env(OrtLoggingLevel logging_level = ORT_LOGGING_LEVEL_WARNING, _In_ const char* logid = "");
1243
1245 Env(OrtLoggingLevel logging_level, const char* logid, OrtLoggingFunction logging_function, void* logger_param);
1246
1248 Env(const OrtThreadingOptions* tp_options, OrtLoggingLevel logging_level = ORT_LOGGING_LEVEL_WARNING, _In_ const char* logid = "");
1249
1251 Env(const OrtThreadingOptions* tp_options, OrtLoggingFunction logging_function, void* logger_param,
1252 OrtLoggingLevel logging_level = ORT_LOGGING_LEVEL_WARNING, _In_ const char* logid = "");
1253
1255 explicit Env(const OrtEnvCreationOptions* options);
1256
1258 explicit Env(OrtEnv* p) : Base<OrtEnv>{p} {}
1259
1262
1264
1265 Env& CreateAndRegisterAllocator(const OrtMemoryInfo* mem_info, const OrtArenaCfg* arena_cfg);
1266
1267 Env& CreateAndRegisterAllocatorV2(const std::string& provider_type, const OrtMemoryInfo* mem_info,
1268 const std::unordered_map<std::string, std::string>& options,
1269 const OrtArenaCfg* arena_cfg);
1270
1272
1274
1276 OrtAllocatorType allocator_type,
1277 const OrtKeyValuePairs* allocator_options);
1278
1279 // Result may be nullptr
1281
1283 OrtDeviceMemoryType mem_type);
1284
1285 Env& RegisterExecutionProviderLibrary(const char* registration_name, const std::basic_string<ORTCHAR_T>& path);
1286 Env& UnregisterExecutionProviderLibrary(const char* registration_name);
1287
1288 std::vector<ConstEpDevice> GetEpDevices() const;
1289
1290 Status CopyTensors(const std::vector<Value>& src_tensors,
1291 const std::vector<Value>& dst_tensors,
1292 OrtSyncStream* stream) const;
1293};
1294
// Owning wrapper for an OrtCustomOpDomain pointer.
1298struct CustomOpDomain : detail::Base<OrtCustomOpDomain> {
 // Inherit the detail::Base constructors.
1300 using Base::Base;
1301
 // Creates an empty wrapper holding no domain.
1302 explicit CustomOpDomain(std::nullptr_t) {}
1303
 // Declared here, defined elsewhere — presumably creates a new domain named `domain`.
1305 explicit CustomOpDomain(const char* domain);
1306
1307 // This does not take ownership of the op, simply registers it.
1308 void Add(const OrtCustomOp* op);
1309};
1310
// Owning wrapper for an OrtLoraAdapter pointer. Instances are obtained through the static
// factory functions below, which are declared here and defined elsewhere.
1312struct LoraAdapter : detail::Base<OrtLoraAdapter> {
 // Inherit the detail::Base constructors.
1314 using Base::Base;
1315
 // Creates an empty wrapper holding no adapter.
1316 explicit LoraAdapter(std::nullptr_t) {}
 // Creates an adapter from a file path.
 // NOTE(review): the role of `allocator` (and whether it may be null) is not visible here.
1323 static LoraAdapter CreateLoraAdapter(const std::basic_string<ORTCHAR_T>& adapter_path,
1324 OrtAllocator* allocator);
1325
 // Creates an adapter from an in-memory buffer of `num_bytes` bytes.
 // NOTE(review): whether the buffer must outlive the adapter is not visible here.
1333 static LoraAdapter CreateLoraAdapterFromArray(const void* bytes, size_t num_bytes,
1334 OrtAllocator* allocator);
1335};
1336
// Owning wrapper for an OrtRunOptions pointer. The setters return RunOptions&, so calls
// can be chained. Members are declared here and defined elsewhere.
1340struct RunOptions : detail::Base<OrtRunOptions> {
 // Creates an empty wrapper holding no options object.
1341 explicit RunOptions(std::nullptr_t) {}
1343
1346
1349
1350 RunOptions& SetRunTag(const char* run_tag);
1351 const char* GetRunTag() const;
1352
1353 RunOptions& AddConfigEntry(const char* config_key, const char* config_value);
 // NOTE(review): unlike GetRunTag(), this getter is not declared const.
1354 const char* GetConfigEntry(const char* config_key);
1355
1362
1368
1376
1385};
1386
1387namespace detail {
1388// Utility function that returns a SessionOption config entry key for a specific custom operator.
1389// Ex: custom_op.[custom_op_name].[config]
1390std::string MakeCustomOpConfigEntryKey(const char* custom_op_name, const char* config);
1391} // namespace detail
1392
1403 CustomOpConfigs() = default;
1404 ~CustomOpConfigs() = default;
1409
1418 CustomOpConfigs& AddConfig(const char* custom_op_name, const char* config_key, const char* config_value);
1419
1428 const std::unordered_map<std::string, std::string>& GetFlattenedConfigs() const;
1429
1430 private:
1431 std::unordered_map<std::string, std::string> flat_configs_;
1432};
1433
1439namespace detail {
1440// we separate const-only methods because passing const ptr to non-const methods
1441// is only discovered when inline methods are compiled which is counter-intuitive
// Read-only part of the session options interface; T is the template argument forwarded
// to detail::Base. All members are const and are declared here, defined elsewhere.
1442template <typename T>
1443struct ConstSessionOptionsImpl : Base<T> {
1444 using B = Base<T>;
 // Inherit the Base<T> constructors.
1445 using B::B;
1446
 // Returns an owning SessionOptions object — presumably an independent copy of these options.
1447 SessionOptions Clone() const;
1448
1449 std::string GetConfigEntry(const char* config_key) const;
1450 bool HasConfigEntry(const char* config_key) const;
 // Like GetConfigEntry, with `def` as the fallback — presumably returned when the key is absent.
1451 std::string GetConfigEntryOrDefault(const char* config_key, const std::string& def) const;
1452};
1453
// Mutating part of the session options interface, layered on ConstSessionOptionsImpl<T>.
// Every member returns SessionOptionsImpl&, so calls can be chained. All members are
// declared here and defined elsewhere.
1454template <typename T>
1455struct SessionOptionsImpl : ConstSessionOptionsImpl<T> {
1456 using B = ConstSessionOptionsImpl<T>;
 // Inherit the constructors of the const-only layer.
1457 using B::B;
1458
 // --- Threading, optimization and general behaviour ---
1459 SessionOptionsImpl& SetIntraOpNumThreads(int intra_op_num_threads);
1460 SessionOptionsImpl& SetInterOpNumThreads(int inter_op_num_threads);
1461 SessionOptionsImpl& SetGraphOptimizationLevel(GraphOptimizationLevel graph_optimization_level);
1462 SessionOptionsImpl& SetDeterministicCompute(bool value);
1463
1464 SessionOptionsImpl& EnableCpuMemArena();
1465 SessionOptionsImpl& DisableCpuMemArena();
1466
1467 SessionOptionsImpl& SetOptimizedModelFilePath(const ORTCHAR_T* optimized_model_file);
1468
1469 SessionOptionsImpl& EnableProfiling(const ORTCHAR_T* profile_file_prefix);
1470 SessionOptionsImpl& DisableProfiling();
1471
1472 SessionOptionsImpl& EnableOrtCustomOps();
1473
1474 SessionOptionsImpl& EnableMemPattern();
1475 SessionOptionsImpl& DisableMemPattern();
1476
1477 SessionOptionsImpl& SetExecutionMode(ExecutionMode execution_mode);
1478
1479 SessionOptionsImpl& SetLoadCancellationFlag(bool value);
1480
 // --- Logging ---
1481 SessionOptionsImpl& SetLogId(const char* logid);
1482 SessionOptionsImpl& SetLogSeverityLevel(int level);
1483
 // Registers a custom op domain — NOTE(review): takes a raw pointer; ownership is not visible here.
1484 SessionOptionsImpl& Add(OrtCustomOpDomain* custom_op_domain);
1485
1486 SessionOptionsImpl& DisablePerSessionThreads();
1487
1488 SessionOptionsImpl& AddConfigEntry(const char* config_key, const char* config_value);
1489
 // --- Initializers ---
 // NOTE(review): the parallel vectors below presumably must have matching lengths — confirm against the definitions.
1490 SessionOptionsImpl& AddInitializer(const char* name, const OrtValue* ort_val);
1491 SessionOptionsImpl& AddExternalInitializers(const std::vector<std::string>& names, const std::vector<Value>& ort_values);
1492 SessionOptionsImpl& AddExternalInitializersFromFilesInMemory(const std::vector<std::basic_string<ORTCHAR_T>>& external_initializer_file_names,
1493 const std::vector<char*>& external_initializer_file_buffer_array,
1494 const std::vector<size_t>& external_initializer_file_lengths);
1495
 // --- Execution provider registration ---
1496 SessionOptionsImpl& AppendExecutionProvider_CPU(int use_arena);
1497 SessionOptionsImpl& AppendExecutionProvider_CUDA(const OrtCUDAProviderOptions& provider_options);
1498 SessionOptionsImpl& AppendExecutionProvider_CUDA_V2(const OrtCUDAProviderOptionsV2& provider_options);
1499 SessionOptionsImpl& AppendExecutionProvider_ROCM(const OrtROCMProviderOptions& provider_options);
1500 SessionOptionsImpl& AppendExecutionProvider_OpenVINO(const OrtOpenVINOProviderOptions& provider_options);
1502 SessionOptionsImpl& AppendExecutionProvider_OpenVINO_V2(const std::unordered_map<std::string, std::string>& provider_options = {});
1503 SessionOptionsImpl& AppendExecutionProvider_TensorRT(const OrtTensorRTProviderOptions& provider_options);
1504 SessionOptionsImpl& AppendExecutionProvider_TensorRT_V2(const OrtTensorRTProviderOptionsV2& provider_options);
1505 SessionOptionsImpl& AppendExecutionProvider_MIGraphX(const OrtMIGraphXProviderOptions& provider_options);
1507 SessionOptionsImpl& AppendExecutionProvider_CANN(const OrtCANNProviderOptions& provider_options);
1509 SessionOptionsImpl& AppendExecutionProvider_Dnnl(const OrtDnnlProviderOptions& provider_options);
 // Generic form: provider selected by name, options passed as string key/value pairs.
1511 SessionOptionsImpl& AppendExecutionProvider(const std::string& provider_name,
1512 const std::unordered_map<std::string, std::string>& provider_options = {});
1513
 // Device-based forms: the two overloads differ only in how the options are passed.
1516 SessionOptionsImpl& AppendExecutionProvider_V2(Env& env, const std::vector<ConstEpDevice>& ep_devices,
1517 const KeyValuePairs& ep_options);
1520 SessionOptionsImpl& AppendExecutionProvider_V2(Env& env, const std::vector<ConstEpDevice>& ep_devices,
1521 const std::unordered_map<std::string, std::string>& ep_options);
1522
 // Selection policy given either as a predefined policy value or as a delegate with optional state.
1524 SessionOptionsImpl& SetEpSelectionPolicy(OrtExecutionProviderDevicePolicy policy);
1525
1527 SessionOptionsImpl& SetEpSelectionPolicy(EpSelectionDelegate delegate, void* state = nullptr);
1528
 // --- Custom thread hooks ---
1529 SessionOptionsImpl& SetCustomCreateThreadFn(OrtCustomCreateThreadFn ort_custom_create_thread_fn);
1530 SessionOptionsImpl& SetCustomThreadCreationOptions(void* ort_custom_thread_creation_options);
1531 SessionOptionsImpl& SetCustomJoinThreadFn(OrtCustomJoinThreadFn ort_custom_join_thread_fn);
1532
 // --- Custom operator libraries ---
1536 SessionOptionsImpl& RegisterCustomOpsLibrary(const ORTCHAR_T* library_name, const CustomOpConfigs& custom_op_configs = {});
1537
1538 SessionOptionsImpl& RegisterCustomOpsUsingFunction(const char* function_name);
1539
1541 SessionOptionsImpl& AppendExecutionProvider_VitisAI(const std::unordered_map<std::string, std::string>& provider_options = {});
1542
 // --- Free dimension overrides: one keyed by dimension denotation, one by dimension name ---
1544 SessionOptionsImpl& AddFreeDimensionOverride(const char* dim_denotation, int64_t dim_value);
1545
1547 SessionOptionsImpl& AddFreeDimensionOverrideByName(const char* dim_name, int64_t dim_value);
1548};
1549} // namespace detail
1550
// Non-owning handle to an OrtSessionOptions; exposes the full (mutable) SessionOptionsImpl interface.
1551using UnownedSessionOptions = detail::SessionOptionsImpl<detail::Unowned<OrtSessionOptions>>;
// Non-owning handle to a const OrtSessionOptions; exposes only the ConstSessionOptionsImpl interface.
1552using ConstSessionOptions = detail::ConstSessionOptionsImpl<detail::Unowned<const OrtSessionOptions>>;
1553
// C++ wrapper for OrtSessionOptions. All option-setting member functions are inherited from
// detail::SessionOptionsImpl<OrtSessionOptions>.
// NOTE(review): this listing skips original lines 1559 and 1561-1562, so further members may exist.
1557struct SessionOptions : detail::SessionOptionsImpl<OrtSessionOptions> {
  // Creates an empty wrapper; an instance holding an underlying object must be assigned before use.
1558 explicit SessionOptions(std::nullptr_t) {}
  // Wraps an existing C API pointer by forwarding it to the base class.
1560 explicit SessionOptions(OrtSessionOptions* p) : SessionOptionsImpl<OrtSessionOptions>{p} {}
1563};
1564
// C++ wrapper for OrtModelCompilationOptions, built on detail::Base.
// Every setter returns ModelCompilationOptions& (presumably *this, to allow chaining — confirm
// against the definitions).
// NOTE(review): several declarations below have lost their first line in this listing; only the
// continuation line with the trailing parameters remains. Consult the original header for the
// complete signatures before editing them.
1569struct ModelCompilationOptions : detail::Base<OrtModelCompilationOptions> {
1571 using Base::Base;
1572
  // Creates an empty wrapper that holds no underlying object.
1573 explicit ModelCompilationOptions(std::nullptr_t) {}
1574
  // Construct from an environment plus session options, passed either as the owning wrapper
  // (by const reference) or as the non-owning const handle (by value).
1575 ModelCompilationOptions(const Env& env, const SessionOptions& session_options);
1576 ModelCompilationOptions(const Env& env, ConstSessionOptions session_options);
1577
  // Input model given as a file path.
1578 ModelCompilationOptions& SetInputModelPath(const ORTCHAR_T* input_model_path);
  // (truncated declaration: trailing parameter of a setter that takes a data size)
1580 size_t input_model_data_size);
1581 ModelCompilationOptions& SetEpContextEmbedMode(bool embed_ep_context_in_model);
  // Output model given as a file path.
1582 ModelCompilationOptions& SetOutputModelPath(const ORTCHAR_T* output_model_path);
  // (truncated declaration: trailing parameter of a setter that takes an initializer size threshold)
1584 size_t initializer_size_threshold);
1585
  // (truncated declaration: trailing parameters of a setter that takes a callback and opaque state)
1588 OrtGetInitializerLocationFunc get_initializer_location_func,
1589 void* state);
1590
  // Takes an allocator and two out-pointers (buffer pointer and buffer size).
1591 ModelCompilationOptions& SetOutputModelBuffer(OrtAllocator* allocator, void** output_model_buffer_ptr,
1592 size_t* output_model_buffer_size_ptr);
1593
1596
1597 ModelCompilationOptions& SetEpContextBinaryInformation(const ORTCHAR_T* output_directory,
1598 const ORTCHAR_T* model_name);
1600
1602};
1603
// Declaration only: takes the environment and a set of model compilation options and reports the
// outcome through the returned Status.
// NOTE(review): presumably runs the compilation described by model_compilation_options — confirm
// against the definition.
1610Status CompileModel(const Env& env, const ModelCompilationOptions& model_compilation_options);
1611
// C++ wrapper for OrtModelMetadata, built on detail::Base.
// NOTE(review): most accessor declarations are missing from this listing (only their line-number
// residue remains); consult the original header for the full interface.
1615struct ModelMetadata : detail::Base<OrtModelMetadata> {
1617 using Base::Base;
1618
  // Creates an empty wrapper that holds no underlying object.
1619 explicit ModelMetadata(std::nullptr_t) {}
1620
1628
1636
1644
1652
1660
  // Returns the custom metadata map keys as a vector of AllocatedStringPtr; takes the allocator to use.
1667 std::vector<AllocatedStringPtr> GetCustomMetadataMapKeysAllocated(OrtAllocator* allocator) const;
1668
1679
  // Returns the version as a 64-bit signed integer.
1680 int64_t GetVersion() const;
1681};
1682
1683struct IoBinding;
1684
1685namespace detail {
1686
1687// we separate const-only methods because passing const ptr to non-const methods
1688// is only discovered when inline methods are compiled which is counter-intuitive
1689template <typename T>
1691 using B = Base<T>;
1692 using B::B;
1693
1694 size_t GetInputCount() const;
1695 size_t GetOutputCount() const;
1697
1698 std::vector<std::string> GetInputNames() const;
1699 std::vector<std::string> GetOutputNames() const;
1700 std::vector<std::string> GetOverridableInitializerNames() const;
1701
1702 std::vector<ConstMemoryInfo> GetMemoryInfoForInputs() const;
1703 std::vector<ConstMemoryInfo> GetMemoryInfoForOutputs() const;
1704 std::vector<ConstEpDevice> GetEpDeviceForInputs() const;
1705 std::vector<ConstEpDevice> GetEpDeviceForOutputs() const;
1706
1715
1724
1733
1734 uint64_t GetProfilingStartTimeNs() const;
1736
1737 TypeInfo GetInputTypeInfo(size_t index) const;
1738 TypeInfo GetOutputTypeInfo(size_t index) const;
1740
1741 int GetOpset(const std::string& domain) const;
1742
1743 std::vector<ValueInfo> GetInputs() const;
1744 std::vector<ValueInfo> GetOutputs() const;
1745
1750 std::vector<ConstEpAssignedSubgraph> GetEpGraphAssignmentInfo() const;
1751};
1752
1753template <typename T>
1756 using B::B;
1757
1775 std::vector<Value> Run(const RunOptions& run_options, const char* const* input_names, const Value* input_values, size_t input_count,
1776 const char* const* output_names, size_t output_count);
1777
1781 void Run(const RunOptions& run_options, const char* const* input_names, const Value* input_values, size_t input_count,
1782 const char* const* output_names, Value* output_values, size_t output_count);
1783
1784 void Run(const RunOptions& run_options, const IoBinding&);
1785
1805 void RunAsync(const RunOptions& run_options, const char* const* input_names, const Value* input_values, size_t input_count,
1806 const char* const* output_names, Value* output_values, size_t output_count, RunAsyncCallbackFn callback, void* user_data);
1807
1815
1827 void SetEpDynamicOptions(const char* const* keys, const char* const* values, size_t kv_len);
1828
1829 void FinalizeModelEditorSession(const Model& model, const SessionOptions& options,
1830 OrtPrepackedWeightsContainer* prepacked_weights_container = nullptr);
1831};
1832
1833} // namespace detail
1834
1837
// C++ wrapper for OrtSession. The run/query member functions are inherited from
// detail::SessionImpl<OrtSession>; this struct adds the constructors and the conversions to
// non-owning handles.
1841struct Session : detail::SessionImpl<OrtSession> {
  // Creates an empty wrapper; an instance holding an underlying object must be assigned before use.
1843 explicit Session(std::nullptr_t) {}
  // Wraps an existing C API pointer by forwarding it to the base class.
1844 explicit Session(OrtSession* p) : SessionImpl{p} {}
1845
  // Construct from a model file path.
1846 Session(const Env& env, const ORTCHAR_T* model_path, const SessionOptions& options);
1847
  // Construct from a model file path, additionally passing a prepacked-weights container.
1849 Session(const Env& env, const ORTCHAR_T* model_path, const SessionOptions& options,
1850 OrtPrepackedWeightsContainer* prepacked_weights_container);
1851
  // Construct from an in-memory model buffer of model_data_length bytes.
1853 Session(const Env& env, const void* model_data, size_t model_data_length, const SessionOptions& options);
1854
  // Construct from an in-memory model buffer, additionally passing a prepacked-weights container.
1856 Session(const Env& env, const void* model_data, size_t model_data_length, const SessionOptions& options,
1857 OrtPrepackedWeightsContainer* prepacked_weights_container);
1858
  // The members below are compiled out when ORT_MINIMAL_BUILD is defined.
1859#if !defined(ORT_MINIMAL_BUILD)
  // Construct from a Model object.
1861 Session(const Env& env, const Model& model, const SessionOptions& options);
1862
  // Factory overloads taking a model path or an in-memory model buffer.
1864 static Session CreateModelEditorSession(const Env& env, const ORTCHAR_T* model_path, const SessionOptions& options);
1865
1867 static Session CreateModelEditorSession(const Env& env, const void* model_data, size_t model_data_length,
1868 const SessionOptions& options);
1869#endif // !defined(ORT_MINIMAL_BUILD)
1870
  // Non-owning views built from the same underlying pointer; this Session must outlive them.
1871 ConstSession GetConst() const { return ConstSession{this->p_}; }
1872 UnownedSession GetUnowned() const { return UnownedSession{this->p_}; }
1873};
1874
1875namespace detail {
1876template <typename T>
1878 using B = Base<T>;
1879 using B::B;
1880
1882 size_t GetElementCount() const;
1883
1884 size_t GetDimensionsCount() const;
1885
1890 [[deprecated("use GetShape()")]] void GetDimensions(int64_t* values, size_t values_count) const;
1891
1892 void GetSymbolicDimensions(const char** values, size_t values_count) const;
1893 std::vector<const char*> GetSymbolicDimensions() const;
1894
1895 bool HasShape() const;
1896 std::vector<int64_t> GetShape() const;
1897};
1898
1899} // namespace detail
1900
1902
1908 using Base::Base;
1909
1911 explicit TensorTypeAndShapeInfo(std::nullptr_t) {}
1913 explicit TensorTypeAndShapeInfo(OrtTensorTypeAndShapeInfo* p) : TensorTypeAndShapeInfoImpl{p} {}
1914
1915 // Create a TensorTypeAndShapeInfo object with the specified element type and dimensions
1916 // symbolic_dims are optional, but should be 1:1 with dims.
1917 // The value in symbolic_dims will be used for all entries in dims that are -1.
1919 const std::vector<int64_t>& dims,
1920 const std::vector<std::string>* symbolic_dims = nullptr);
1921
1923};
1924
1925namespace detail {
1926template <typename T>
1928 using B = Base<T>;
1929 using B::B;
1931};
1932
1933} // namespace detail
1934
1936
// C++ wrapper for OrtSequenceTypeInfo; accessors are inherited from detail::SequenceTypeInfoImpl.
1940struct SequenceTypeInfo : detail::SequenceTypeInfoImpl<OrtSequenceTypeInfo> {
1942 using Base::Base;
1943
  // Creates an empty wrapper that holds no underlying object.
1944 explicit SequenceTypeInfo(std::nullptr_t) {}
  // Wraps an existing C API pointer by forwarding it to the base class.
1945 explicit SequenceTypeInfo(OrtSequenceTypeInfo* p) : SequenceTypeInfoImpl<OrtSequenceTypeInfo>{p} {}
1947};
1948
1949namespace detail {
1950template <typename T>
1952 using B = Base<T>;
1953 using B::B;
1955};
1956
1957} // namespace detail
1958
1959// This is always owned by the TypeInfo and can only be obtained from it.
1961
1962namespace detail {
1963template <typename T>
1970
1971} // namespace detail
1972
1974
// C++ wrapper for OrtMapTypeInfo; accessors are inherited from detail::MapTypeInfoImpl.
1978struct MapTypeInfo : detail::MapTypeInfoImpl<OrtMapTypeInfo> {
1980 using Base::Base;
1981
  // Creates an empty wrapper that holds no underlying object.
1982 explicit MapTypeInfo(std::nullptr_t) {}
  // Wraps an existing C API pointer by forwarding it to the base class.
1983 explicit MapTypeInfo(OrtMapTypeInfo* p) : MapTypeInfoImpl<OrtMapTypeInfo>{p} {}
  // Non-owning const view built from the same underlying pointer; this object must outlive it.
1984 ConstMapTypeInfo GetConst() const { return ConstMapTypeInfo{this->p_}; }
1985};
1986
1987namespace detail {
1988template <typename T>
2000} // namespace detail
2001
2007
// C++ wrapper for OrtTypeInfo; accessors are inherited from detail::TypeInfoImpl.
2012struct TypeInfo : detail::TypeInfoImpl<OrtTypeInfo> {
2014 using Base::Base;
2015
  // Creates an empty wrapper that holds no underlying object.
2017 explicit TypeInfo(std::nullptr_t) {}
  // Wraps an existing C API pointer by forwarding it to the base class.
2018 explicit TypeInfo(OrtTypeInfo* p) : TypeInfoImpl<OrtTypeInfo>{p} {}
2019
  // NOTE(review): the declarations inside this conditional section are missing from this listing.
2020#if !defined(ORT_MINIMAL_BUILD)
2026#endif // !defined(ORT_MINIMAL_BUILD)
2027
  // Non-owning const view built from the same underlying pointer; this object must outlive it.
2028 ConstTypeInfo GetConst() const { return ConstTypeInfo{this->p_}; }
2029};
2030
2031namespace detail {
2032// This structure is used to feed sparse tensor values
2033// information for use with FillSparseTensor<Format>() API
2034// if the data type for the sparse tensor values is numeric
2035// use data.p_data, otherwise, use data.str pointer to feed
2036// values. data.str is an array of const char* that are zero terminated.
2037// number of strings in the array must match shape size.
2038// For fully sparse tensors use shape {0} and set p_data/str
2039// to nullptr.
2041 const int64_t* values_shape;
2043 union {
2044 const void* p_data;
2045 const char** str;
2046 } data;
2047};
2048
2049// Provides a way to pass shape in a single
2050// argument
2051struct Shape {
  // Pointer to the (read-only) dimension values; the struct does not own them.
  // NOTE(review): original line 2053 is missing from this listing — presumably the member that
  // holds the number of dimensions; confirm against the original header.
2052 const int64_t* shape;
2054};
2055
2056template <typename T>
2058 using B = Base<T>;
2059 using B::B;
2060
2064 template <typename R>
2065 void GetOpaqueData(const char* domain, const char* type_name, R&) const;
2066
2067 bool IsTensor() const;
2068 bool HasValue() const;
2069
2070 size_t GetCount() const; // If a non tensor, returns 2 for map and N for sequence, where N is the number of elements
2071 Value GetValue(int index, OrtAllocator* allocator) const;
2072
2080
2095 void GetStringTensorContent(void* buffer, size_t buffer_length, size_t* offsets, size_t offsets_count) const;
2096
2103 template <typename R>
2104 const R* GetTensorData() const;
2105
2110 const void* GetTensorRawData() const;
2111
2119
2127
2133
2142 void GetStringTensorElement(size_t buffer_length, size_t element_index, void* buffer) const;
2143
2150 std::string GetStringTensorElement(size_t element_index) const;
2151
2158 size_t GetStringTensorElementLength(size_t element_index) const;
2159
2166 size_t GetTensorSizeInBytes() const;
2167
2168#if !defined(DISABLE_SPARSE_TENSORS)
2176
2183
2192
2202 template <typename R>
2203 const R* GetSparseTensorIndicesData(OrtSparseIndicesFormat indices_format, size_t& num_indices) const;
2204
2209 bool IsSparseTensor() const;
2210
2219 template <typename R>
2220 const R* GetSparseTensorValues() const;
2221
2222#endif
2223};
2224
2225template <typename T>
2228 using B::B;
2229
2235 template <typename R>
2237
2243
2245 // Obtain a reference to an element of data at the location specified
2251 template <typename R>
2252 R& At(const std::vector<int64_t>& location);
2253
2259 void FillStringTensor(const char* const* s, size_t s_len);
2260
2266 void FillStringTensorElement(const char* s, size_t index);
2267
2280 char* GetResizedStringTensorElementBuffer(size_t index, size_t buffer_length);
2281
2282#if !defined(DISABLE_SPARSE_TENSORS)
2291 void UseCooIndices(int64_t* indices_data, size_t indices_num);
2292
2303 void UseCsrIndices(int64_t* inner_data, size_t inner_num, int64_t* outer_data, size_t outer_num);
2304
2313 void UseBlockSparseIndices(const Shape& indices_shape, int32_t* indices_data);
2314
2324 void FillSparseTensorCoo(const OrtMemoryInfo* data_mem_info, const OrtSparseValuesParam& values_param,
2325 const int64_t* indices_data, size_t indices_num);
2326
2338 void FillSparseTensorCsr(const OrtMemoryInfo* data_mem_info,
2339 const OrtSparseValuesParam& values,
2340 const int64_t* inner_indices_data, size_t inner_indices_num,
2341 const int64_t* outer_indices_data, size_t outer_indices_num);
2342
2353 const OrtSparseValuesParam& values,
2354 const Shape& indices_shape,
2355 const int32_t* indices_data);
2356
2357#endif
2358};
2359
2360} // namespace detail
2361
2364
// C++ wrapper for OrtValue. Accessors are inherited from detail::ValueImpl<OrtValue>; this struct
// adds move support, conversions to non-owning handles, and static factory functions.
// NOTE(review): some factory declarations below have lost their final parameter line in this
// listing; consult the original header for the complete signatures.
2368struct Value : detail::ValueImpl<OrtValue> {
2370 using Base::Base;
2373
  // Creates an empty Value. Not marked explicit, so nullptr converts to Value implicitly.
2374 Value(std::nullptr_t) {}
  // Move-only semantics are spelled out explicitly here.
2375 Value(Value&&) = default;
2376 Value& operator=(Value&&) = default;
2377
  // Non-owning views built from the same underlying pointer; this Value must outlive them.
2378 ConstValue GetConst() const { return ConstValue{this->p_}; }
2379 UnownedValue GetUnowned() const { return UnownedValue{this->p_}; }
2380
  // Typed overload: caller supplies the data pointer, its size as an element count, and the shape.
2389 template <typename T>
2390 static Value CreateTensor(const OrtMemoryInfo* info, T* p_data, size_t p_data_element_count,
2391 const int64_t* shape, size_t shape_len);
2392
  // Untyped overload: caller supplies the data pointer and its size as a byte count.
2402 static Value CreateTensor(const OrtMemoryInfo* info, void* p_data, size_t p_data_byte_count,
2403 const int64_t* shape, size_t shape_len,
2405
  // Untyped overload that takes an allocator (named `deleter`) instead of memory info.
2415 static Value CreateTensor(OrtAllocator* deleter, void* p_data, size_t p_data_byte_count,
2416 const int64_t* shape, size_t shape_len,
2418
  // Typed overload that takes only an allocator and a shape (no caller-supplied data pointer).
2430 template <typename T>
2431 static Value CreateTensor(OrtAllocator* allocator, const int64_t* shape, size_t shape_len);
2432
  // Untyped counterpart of the allocator + shape overload.
2444 static Value CreateTensor(OrtAllocator* allocator, const int64_t* shape, size_t shape_len,
2446
  // Builds a Value from a keys Value and a values Value.
2455 static Value CreateMap(const Value& keys, const Value& values);
2456
  // Builds a Value from a vector of Values.
2464 static Value CreateSequence(const std::vector<Value>& values);
2465
  // Builds a Value from an arbitrary object identified by a domain and type name.
2474 template <typename T>
2475 static Value CreateOpaque(const char* domain, const char* type_name, const T& value);
2476
  // Sparse-tensor factories; compiled out when DISABLE_SPARSE_TENSORS is defined.
2477#if !defined(DISABLE_SPARSE_TENSORS)
  // Typed overload: caller supplies the values pointer plus the dense and values shapes.
2488 template <typename T>
2489 static Value CreateSparseTensor(const OrtMemoryInfo* info, T* p_data, const Shape& dense_shape,
2490 const Shape& values_shape);
2491
  // Untyped overload: element type is passed explicitly.
2508 static Value CreateSparseTensor(const OrtMemoryInfo* info, void* p_data, const Shape& dense_shape,
2509 const Shape& values_shape, ONNXTensorElementDataType type);
2510
  // Typed overload that takes only an allocator and the dense shape.
2520 template <typename T>
2521 static Value CreateSparseTensor(OrtAllocator* allocator, const Shape& dense_shape);
2522
  // Untyped counterpart of the allocator + dense shape overload.
2534 static Value CreateSparseTensor(OrtAllocator* allocator, const Shape& dense_shape, ONNXTensorElementDataType type);
2535
2536#endif // !defined(DISABLE_SPARSE_TENSORS)
2537};
2538
2539namespace detail {
// Non-template helpers that operate directly on an OrtIoBinding pointer and an allocator.
2540namespace binding_utils {
2541// Bring these out of template
// Returns the output names as a vector of std::string.
2542std::vector<std::string> GetOutputNamesHelper(const OrtIoBinding* binding, OrtAllocator*);
// Returns the output values as a vector of Value.
2543std::vector<Value> GetOutputValuesHelper(const OrtIoBinding* binding, OrtAllocator*);
2544} // namespace binding_utils
2545
2546template <typename T>
2548 using B = Base<T>;
2549 using B::B;
2550
2551 std::vector<std::string> GetOutputNames() const;
2552 std::vector<std::string> GetOutputNames(OrtAllocator*) const;
2553 std::vector<Value> GetOutputValues() const;
2554 std::vector<Value> GetOutputValues(OrtAllocator*) const;
2555};
2556
2557template <typename T>
2560 using B::B;
2561
2562 void BindInput(const char* name, const Value&);
2563 void BindOutput(const char* name, const Value&);
2564 void BindOutput(const char* name, const OrtMemoryInfo*);
2569};
2570
2571} // namespace detail
2572
2575
// C++ wrapper for OrtIoBinding; bind/query member functions are inherited from detail::IoBindingImpl.
2579struct IoBinding : detail::IoBindingImpl<OrtIoBinding> {
  // Creates an empty wrapper that holds no underlying object.
2580 explicit IoBinding(std::nullptr_t) {}
  // Constructs a binding from a session (defined out of line).
2581 explicit IoBinding(Session& session);
  // Non-owning views built from the same underlying pointer; this object must outlive them.
2582 ConstIoBinding GetConst() const { return ConstIoBinding{this->p_}; }
2583 UnownedIoBinding GetUnowned() const { return UnownedIoBinding{this->p_}; }
2584};
2585
// C++ wrapper for OrtArenaCfg, built on detail::Base.
2590struct ArenaCfg : detail::Base<OrtArenaCfg> {
  // Creates an empty wrapper that holds no underlying object.
2591 explicit ArenaCfg(std::nullptr_t) {}
  // Constructs from four individual settings. Note the mixed types: max_mem is size_t while the
  // other three are int.
2600 ArenaCfg(size_t max_mem, int arena_extend_strategy, int initial_chunk_size_bytes, int max_dead_bytes_per_chunk);
2601
  // Constructs from a map of setting name to size_t value.
2606 explicit ArenaCfg(const std::unordered_map<std::string, size_t>& arena_config);
2607};
2608
2609//
2610// Custom OPs (only needed to implement custom OPs)
2611//
2612
2613namespace detail {
2614// Need to define a templated ConstOpAttr with const members
2615template <typename T>
2618 using B::B;
2619
2620 // Wraps OrtApi::OpAttr_GetName
2621 std::string GetName() const;
2622 // Wraps OrtApi::OpAttr_GetType
2624
2625 // Wraps OrtApi::ReadAttr for a single value
2626 // This does not support Tensor Attribute
2627 // Call GetTensorAttributeAsOrtValue() instead.
2628 template <typename R>
2629 Status GetValue(R& out) const;
2630
2631 // Wraps OrtApi::ReadAttr for an array of values
2632 template <typename R>
2633 Status GetValueArray(std::vector<R>& out) const;
2634 // Wraps OrtApi::OpAttr_GetTensorAttributeAsOrtValue
2636};
2637} // namespace detail
2638
2640
// C++ wrapper for OrtOpAttr; read accessors are inherited from detail::ConstOpAttrImpl.
2644struct OpAttr : detail::ConstOpAttrImpl<OrtOpAttr> {
2646 using Base::Base;
2647
2648 OpAttr() = default; // Enable storing it in the container for resize()
  // Creates an empty wrapper that holds no underlying object.
2649 explicit OpAttr(std::nullptr_t) {}
  // Constructs an attribute from a name, a pointer to the data, a length and the attribute type.
  // NOTE(review): whether `len` counts bytes or elements is not visible here — confirm in the C API docs.
2650 OpAttr(const char* name, const void* data, int len, OrtOpAttrType type);
2651
  // Non-owning const view built from the same underlying pointer; this object must outlive it.
2652 ConstOpAttr GetConst() const { return ConstOpAttr{this->p_}; }
2653};
2654
/// Logs `message` through `logger` if `message_severity` is at or above the logger's severity level.
/// The status returned by LogMessage() is passed to Ort::ThrowOnError().
///
/// `logger` and `message_severity` are parenthesized in the expansion so that arbitrary expressions
/// (for example `*logger_ptr` or a conditional expression) expand with the intended precedence.
/// Note: `message_severity` is evaluated twice when the message is logged, so it must be free of
/// side effects.
#define ORT_CXX_LOG(logger, message_severity, message)                                   \
  do {                                                                                   \
    if ((message_severity) >= (logger).GetLoggingSeverityLevel()) {                      \
      Ort::ThrowOnError((logger).LogMessage((message_severity), ORT_FILE, __LINE__,      \
                                            static_cast<const char*>(__FUNCTION__),      \
                                            message));                                   \
    }                                                                                    \
  } while (false)
2670
/// Logs `message` through `logger` if `message_severity` is at or above the logger's severity level.
/// Unlike ORT_CXX_LOG, the status returned by LogMessage() is explicitly discarded.
///
/// `logger` and `message_severity` are parenthesized in the expansion so that arbitrary expressions
/// (for example `*logger_ptr`) expand with the intended precedence.
/// Note: `message_severity` is evaluated twice when the message is logged, so it must be free of
/// side effects.
#define ORT_CXX_LOG_NOEXCEPT(logger, message_severity, message)                          \
  do {                                                                                   \
    if ((message_severity) >= (logger).GetLoggingSeverityLevel()) {                      \
      static_cast<void>((logger).LogMessage((message_severity), ORT_FILE, __LINE__,      \
                                            static_cast<const char*>(__FUNCTION__),      \
                                            message));                                   \
    }                                                                                    \
  } while (false)
2686
/// Logs a printf-style formatted message through `logger` if `message_severity` is at or above the
/// logger's severity level. The variadic arguments (format string first, then its arguments) are
/// forwarded to LogFormattedMessage(), and the returned status is passed to Ort::ThrowOnError().
///
/// `logger` and `message_severity` are parenthesized in the expansion so that arbitrary expressions
/// (for example `*logger_ptr`) expand with the intended precedence.
/// Note: `message_severity` is evaluated twice when the message is logged, so it must be free of
/// side effects.
#define ORT_CXX_LOGF(logger, message_severity, /*format,*/...)                                  \
  do {                                                                                          \
    if ((message_severity) >= (logger).GetLoggingSeverityLevel()) {                             \
      Ort::ThrowOnError((logger).LogFormattedMessage((message_severity), ORT_FILE, __LINE__,    \
                                                     static_cast<const char*>(__FUNCTION__),    \
                                                     __VA_ARGS__));                             \
    }                                                                                           \
  } while (false)
2705
/// Logs a printf-style formatted message through `logger` if `message_severity` is at or above the
/// logger's severity level. The variadic arguments (format string first, then its arguments) are
/// forwarded to LogFormattedMessage(). Unlike ORT_CXX_LOGF, the returned status is explicitly discarded.
///
/// `logger` and `message_severity` are parenthesized in the expansion so that arbitrary expressions
/// (for example `*logger_ptr`) expand with the intended precedence.
/// Note: `message_severity` is evaluated twice when the message is logged, so it must be free of
/// side effects.
#define ORT_CXX_LOGF_NOEXCEPT(logger, message_severity, /*format,*/...)                         \
  do {                                                                                          \
    if ((message_severity) >= (logger).GetLoggingSeverityLevel()) {                             \
      static_cast<void>((logger).LogFormattedMessage((message_severity), ORT_FILE, __LINE__,    \
                                                     static_cast<const char*>(__FUNCTION__),    \
                                                     __VA_ARGS__));                             \
    }                                                                                           \
  } while (false)
2724
// Lightweight, copyable handle around a `const OrtLogger*`. It stores only the pointer and a
// cached severity level, and all copy/move operations and the destructor are defaulted.
2735struct Logger {
  // Default state: null logger pointer and value-initialized severity (see member initializers).
2739 Logger() = default;
2740
  // Same state as the default constructor, spelled with nullptr.
2744 explicit Logger(std::nullptr_t) {}
2745
  // Constructs from a C API logger pointer (defined out of line).
2752 explicit Logger(const OrtLogger* logger);
2753
2754 ~Logger() = default;
2755
2756 Logger(const Logger&) = default;
2757 Logger& operator=(const Logger&) = default;
2758
2759 Logger(Logger&& v) noexcept = default;
2760 Logger& operator=(Logger&& v) noexcept = default;
2761
  // NOTE(review): a declaration is missing from this listing here (original line 2767). The
  // ORT_CXX_LOG* macros call logger.GetLoggingSeverityLevel(), so it is presumably that accessor.
2768
  // Logs a single message with its source location. Declared noexcept: failures are reported via
  // the returned Status, not by throwing.
2781 Status LogMessage(OrtLoggingLevel log_severity_level, const ORTCHAR_T* file_path, int line_number,
2782 const char* func_name, const char* message) const noexcept;
2783
  // Logs a message built from a format string and a pack of arguments. Also noexcept, with
  // failures reported via the returned Status.
2798 template <typename... Args>
2799 Status LogFormattedMessage(OrtLoggingLevel log_severity_level, const ORTCHAR_T* file_path, int line_number,
2800 const char* func_name, const char* format, Args&&... args) const noexcept;
2801
2802 private:
  // Non-owning pointer to the C API logger; null when default-constructed.
2803 const OrtLogger* logger_{};
  // Severity level kept alongside the pointer.
2804 OrtLoggingLevel cached_severity_level_{};
2805};
2806
2815 size_t GetInputCount() const;
2816 size_t GetOutputCount() const;
2817 // If input is optional and is not present, the method returns an empty ConstValue
2818 // which can be compared to nullptr.
2819 ConstValue GetInput(size_t index) const;
2820 // If output is optional and is not present, the method returns an empty UnownedValue
2821 // which can be compared to nullptr.
2822 UnownedValue GetOutput(size_t index, const int64_t* dim_values, size_t dim_count) const;
2823 UnownedValue GetOutput(size_t index, const std::vector<int64_t>& dims) const;
2824 void* GetGPUComputeStream() const;
2826 Ort::Allocator GetAllocator(const OrtMemoryInfo& memory_info) const;
2827 OrtKernelContext* GetOrtKernelContext() const { return ctx_; }
2828 void ParallelFor(void (*fn)(void*, size_t), size_t total, size_t num_batch, void* usr_data) const;
2829
2830 private:
2831 OrtKernelContext* ctx_;
2832};
2833
2834struct KernelInfo;
2835
2836namespace detail {
// Non-template attribute readers operating on a raw OrtKernelInfo pointer. Each overload writes
// the attribute named `name` into its reference out-parameter; the overload set determines which
// value types KernelInfoImpl::GetAttribute / GetAttributes support.
2837namespace attr_utils {
// Single-valued attributes: float, int64_t and std::string.
2838void GetAttr(const OrtKernelInfo* p, const char* name, float&);
2839void GetAttr(const OrtKernelInfo* p, const char* name, int64_t&);
2840void GetAttr(const OrtKernelInfo* p, const char* name, std::string&);
// Array-valued attributes: std::vector<float> and std::vector<int64_t>.
2841void GetAttrs(const OrtKernelInfo* p, const char* name, std::vector<float>&);
2842void GetAttrs(const OrtKernelInfo* p, const char* name, std::vector<int64_t>&);
2843} // namespace attr_utils
2844
2845template <typename T>
2846struct KernelInfoImpl : Base<T> {
2847 using B = Base<T>;
2848 using B::B;
2849
2850 KernelInfo Copy() const;
2851
2852 template <typename R> // R is only implemented for float, int64_t, and string
2853 R GetAttribute(const char* name) const {
2854 R val;
2855 attr_utils::GetAttr(this->p_, name, val);
2856 return val;
2857 }
2858
2859 template <typename R> // R is only implemented for std::vector<float>, std::vector<int64_t>
2860 std::vector<R> GetAttributes(const char* name) const {
2861 std::vector<R> result;
2862 attr_utils::GetAttrs(this->p_, name, result);
2863 return result;
2864 }
2865
2866 Value GetTensorAttribute(const char* name, OrtAllocator* allocator) const;
2867
2868 size_t GetInputCount() const;
2869 size_t GetOutputCount() const;
2870
2871 std::string GetInputName(size_t index) const;
2872 std::string GetOutputName(size_t index) const;
2873
2874 TypeInfo GetInputTypeInfo(size_t index) const;
2875 TypeInfo GetOutputTypeInfo(size_t index) const;
2876
2877 ConstValue GetTensorConstantInput(size_t index, int* is_constant) const;
2878
2879 std::string GetNodeName() const;
2880 Logger GetLogger() const;
2881
2882 KeyValuePairs GetConfigEntries() const;
2883
2884 std::string GetOperatorDomain() const;
2885 std::string GetOperatorType() const;
2886 int GetOperatorSinceVersion() const;
2887 const OrtEp* GetEp() const;
2888};
2889
2890} // namespace detail
2891
// Non-owning handle to a const OrtKernelInfo exposing the KernelInfoImpl interface.
2892using ConstKernelInfo = detail::KernelInfoImpl<detail::Unowned<const OrtKernelInfo>>;
2893
// C++ wrapper for OrtKernelInfo; accessors are inherited from detail::KernelInfoImpl.
2900struct KernelInfo : detail::KernelInfoImpl<OrtKernelInfo> {
2901 using Base = detail::KernelInfoImpl<OrtKernelInfo>;
2902 using Base::Base;
  // Creates an empty wrapper that holds no underlying object.
2903 explicit KernelInfo(std::nullptr_t) {}
  // Constructs from a C API pointer (defined out of line).
2904 explicit KernelInfo(OrtKernelInfo* info);
  // Non-owning const view built from the same underlying pointer; this object must outlive it.
2905 ConstKernelInfo GetConst() const { return ConstKernelInfo{this->p_}; }
2906};
2907
// C++ wrapper for OrtOp, built on detail::Base. Offers a factory (Create) and two Invoke
// overloads that differ only in how input/output values are passed.
2911struct Op : detail::Base<OrtOp> {
2913 using Base::Base;
2914
  // Creates an empty wrapper that holds no underlying object.
2915 explicit Op(std::nullptr_t) {}
2916
  // Constructs from a C API pointer (defined out of line).
2917 explicit Op(OrtOp*);
2918
  // Factory. type_constraint_names and type_constraint_values are parallel arrays of
  // type_constraint_count entries; attr_values holds attr_count attributes.
2919 static Op Create(const OrtKernelInfo* info, const char* op_name, const char* domain,
2920 int version, const char** type_constraint_names,
2921 const ONNXTensorElementDataType* type_constraint_values,
2922 size_t type_constraint_count,
2923 const OpAttr* attr_values,
2924 size_t attr_count,
2925 size_t input_count, size_t output_count);
2926
  // Invoke with inputs/outputs given as arrays of C++ Value wrappers.
2927 void Invoke(const OrtKernelContext* context,
2928 const Value* input_values,
2929 size_t input_count,
2930 Value* output_values,
2931 size_t output_count);
2932
  // Invoke with inputs/outputs given as arrays of raw OrtValue pointers.
2933 // For easier refactoring
2934 void Invoke(const OrtKernelContext* context,
2935 const OrtValue* const* input_values,
2936 size_t input_count,
2937 OrtValue* const* output_values,
2938 size_t output_count);
2939};
2940
2946 SymbolicInteger(int64_t i) : i_(i), is_int_(true) {};
2947 SymbolicInteger(const char* s) : s_(s), is_int_(false) {};
2950
2953
2954 bool operator==(const SymbolicInteger& dim) const {
2955 if (is_int_ == dim.is_int_) {
2956 if (is_int_) {
2957 return i_ == dim.i_;
2958 } else {
2959 return std::string{s_} == std::string{dim.s_};
2960 }
2961 }
2962 return false;
2963 }
2964
// Accessors. AsInt() and AsSym() return the corresponding union member without checking which
// one is active, so callers should test IsInt() first and read only the matching accessor.
2965 bool IsInt() const { return is_int_; }
2966 int64_t AsInt() const { return i_; }
2967 const char* AsSym() const { return s_; }
2968
2969 static constexpr int INVALID_INT_DIM = -2;
2970
2971 private:
2972 union {
2973 int64_t i_;
2974 const char* s_;
2975 };
2976 bool is_int_;
2977 };
2978
2979 using Shape = std::vector<SymbolicInteger>;
2980
2982
// Returns a reference to the stored shape of the input at position `indice`. Uses the
// bounds-checked at(), so an out-of-range position throws std::out_of_range.
2983 const Shape& GetInputShape(size_t indice) const { return input_shapes_.at(indice); }
2984
// Number of input shapes stored in this context.
2985 size_t GetInputCount() const { return input_shapes_.size(); }
2986
2988
2989 int64_t GetAttrInt(const char* attr_name);
2990
2991 using Ints = std::vector<int64_t>;
2992 Ints GetAttrInts(const char* attr_name);
2993
2994 float GetAttrFloat(const char* attr_name);
2995
2996 using Floats = std::vector<float>;
2997 Floats GetAttrFloats(const char* attr_name);
2998
2999 std::string GetAttrString(const char* attr_name);
3000
3001 using Strings = std::vector<std::string>;
3002 Strings GetAttrStrings(const char* attr_name);
3003
3004 private:
3005 ConstOpAttr GetAttrHdl(const char* attr_name) const;
3006 const OrtApi* ort_api_;
3008 std::vector<Shape> input_shapes_;
3009};
3010
3012
// Default end version for custom ops: 2^31 - 1. Used below as the initial value of end_ver_.
// The whole replacement list is parenthesized so the macro behaves as a single value in any
// surrounding expression (e.g. `MAX_CUSTOM_OP_END_VER / 2`).
#define MAX_CUSTOM_OP_END_VER ((1UL << 31) - 1)
3014
3015template <typename TOp, typename TKernel, bool WithStatus = false>
3019 OrtCustomOp::GetName = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetName(); };
3020
3021 OrtCustomOp::GetExecutionProviderType = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetExecutionProviderType(); };
3022
3023 OrtCustomOp::GetInputTypeCount = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetInputTypeCount(); };
3024 OrtCustomOp::GetInputType = [](const OrtCustomOp* this_, size_t index) { return static_cast<const TOp*>(this_)->GetInputType(index); };
3025 OrtCustomOp::GetInputMemoryType = [](const OrtCustomOp* this_, size_t index) { return static_cast<const TOp*>(this_)->GetInputMemoryType(index); };
3026
3027 OrtCustomOp::GetOutputTypeCount = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetOutputTypeCount(); };
3028 OrtCustomOp::GetOutputType = [](const OrtCustomOp* this_, size_t index) { return static_cast<const TOp*>(this_)->GetOutputType(index); };
3029
3030#if defined(_MSC_VER) && !defined(__clang__)
3031#pragma warning(push)
3032#pragma warning(disable : 26409)
3033#endif
3034 OrtCustomOp::KernelDestroy = [](void* op_kernel) { delete static_cast<TKernel*>(op_kernel); };
3035#if defined(_MSC_VER) && !defined(__clang__)
3036#pragma warning(pop)
3037#endif
3038 OrtCustomOp::GetInputCharacteristic = [](const OrtCustomOp* this_, size_t index) { return static_cast<const TOp*>(this_)->GetInputCharacteristic(index); };
3039 OrtCustomOp::GetOutputCharacteristic = [](const OrtCustomOp* this_, size_t index) { return static_cast<const TOp*>(this_)->GetOutputCharacteristic(index); };
3040
3041 OrtCustomOp::GetVariadicInputMinArity = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetVariadicInputMinArity(); };
3042 OrtCustomOp::GetVariadicInputHomogeneity = [](const OrtCustomOp* this_) { return static_cast<int>(static_cast<const TOp*>(this_)->GetVariadicInputHomogeneity()); };
3043 OrtCustomOp::GetVariadicOutputMinArity = [](const OrtCustomOp* this_) { return static_cast<const TOp*>(this_)->GetVariadicOutputMinArity(); };
3044 OrtCustomOp::GetVariadicOutputHomogeneity = [](const OrtCustomOp* this_) { return static_cast<int>(static_cast<const TOp*>(this_)->GetVariadicOutputHomogeneity()); };
3045#ifdef __cpp_if_constexpr
3046 if constexpr (WithStatus) {
3047#else
3048 if (WithStatus) {
3049#endif
3050 OrtCustomOp::CreateKernelV2 = [](const OrtCustomOp* this_, const OrtApi* api, const OrtKernelInfo* info, void** op_kernel) -> OrtStatusPtr {
3051 return static_cast<const TOp*>(this_)->CreateKernelV2(*api, info, op_kernel);
3052 };
3053 OrtCustomOp::KernelComputeV2 = [](void* op_kernel, OrtKernelContext* context) -> OrtStatusPtr {
3054 return static_cast<TKernel*>(op_kernel)->ComputeV2(context);
3055 };
3056 } else {
3059
3060 OrtCustomOp::CreateKernel = [](const OrtCustomOp* this_, const OrtApi* api, const OrtKernelInfo* info) { return static_cast<const TOp*>(this_)->CreateKernel(*api, info); };
3061 OrtCustomOp::KernelCompute = [](void* op_kernel, OrtKernelContext* context) {
3062 static_cast<TKernel*>(op_kernel)->Compute(context);
3063 };
3064 }
3065
3066 SetShapeInferFn<TOp>(0);
3067
3068 OrtCustomOp::GetStartVersion = [](const OrtCustomOp* this_) {
3069 return static_cast<const TOp*>(this_)->start_ver_;
3070 };
3071
3072 OrtCustomOp::GetEndVersion = [](const OrtCustomOp* this_) {
3073 return static_cast<const TOp*>(this_)->end_ver_;
3074 };
3075
3078 OrtCustomOp::GetAliasMap = nullptr;
3080 }
3081
3082 // Default implementation of GetExecutionProviderType that returns nullptr to default to the CPU provider
3083 const char* GetExecutionProviderType() const { return nullptr; }
3084
3085 // Default implementations of GetInputCharacteristic() and GetOutputCharacteristic() below
3086 // (inputs and outputs are required by default)
3088 return OrtCustomOpInputOutputCharacteristic::INPUT_OUTPUT_REQUIRED;
3089 }
3090
3092 return OrtCustomOpInputOutputCharacteristic::INPUT_OUTPUT_REQUIRED;
3093 }
3094
3095 // Default implementation of GetInputMemoryType() that returns OrtMemTypeDefault
3096 OrtMemType GetInputMemoryType(size_t /*index*/) const {
3097 return OrtMemTypeDefault;
3098 }
3099
3100 // Default implementation of GetVariadicInputMinArity() returns 1 to specify that a variadic input
3101 // should expect at least 1 argument.
3103 return 1;
3104 }
3105
3106 // Default implementation of GetVariadicInputHomogeneity() returns true to specify that all arguments
3107 // to a variadic input should be of the same type.
3109 return true;
3110 }
3111
3112 // Default implementation of GetVariadicOutputMinArity() returns 1 to specify that a variadic output
3113 // should produce at least 1 output value.
3115 return 1;
3116 }
3117
3118 // Default implementation of GetVariadicOutputHomogeneity() returns true to specify that all output values
3119 // produced by a variadic output should be of the same type.
3121 return true;
3122 }
3123
3124 // Declare list of session config entries used by this Custom Op.
3125 // Implement this function in order to get configs from CustomOpBase::GetSessionConfigs().
3126 // This default implementation returns an empty vector of config entries.
3127 std::vector<std::string> GetSessionConfigKeys() const {
3128 return std::vector<std::string>{};
3129 }
3130
3131 // Ort::CustomOpBase derived class should provide the following static method with the type/shape inferencing
3132 // implementation if needed:
3133 // static OrtStatusPtr InferOutputShape(Ort::ShapeInferContext& context)
3134 template <typename C>
3135 decltype(&C::InferOutputShape) SetShapeInferFn(decltype(&C::InferOutputShape)) {
3137 ShapeInferContext ctx(&GetApi(), ort_ctx);
3138 return C::InferOutputShape(ctx);
3139 };
3140 return {};
3141 }
3142
3143 template <typename C>
3147
3148 protected:
3149 // Helper function that returns a map of session config entries specified by CustomOpBase::GetSessionConfigKeys.
3150 void GetSessionConfigs(std::unordered_map<std::string, std::string>& out, ConstSessionOptions options) const;
3151
3152 int start_ver_ = 1;
3153 int end_ver_ = MAX_CUSTOM_OP_END_VER;
3154};
3155
3156// Forward declaration to resolve circular dependency
3157// on ConstNode
3159
3160namespace detail {
3161template <typename T>
3163 using B = Base<T>;
3164 using B::B;
3165
3167 std::string GetName() const;
3173 std::vector<ValueInfoConsumerProducerInfo> GetConsumers() const;
3183 bool IsGraphOutput() const;
3187 bool IsFromOuterScope() const;
3188};
3189} // namespace detail
3190
3191// Const object holder that does not own the underlying object
3193
3198 ValueInfo() = default; // Same thing as with nullptr
3199 explicit ValueInfo(std::nullptr_t) {}
3201 explicit ValueInfo(OrtValueInfo* p) : ConstValueInfoImpl<OrtValueInfo>{p} {}
3202
3203#if !defined(ORT_MINIMAL_BUILD)
3204 // Create ValueInfo for a tensor
3205 explicit ValueInfo(const std::string& name, const ConstTypeInfo& type_info);
3206#endif
3207 ConstValueInfo GetConst() const { return ConstValueInfo{this->p_}; }
3208};
3209
3210// Forward declaration
3211struct AttrNameSubgraph;
3212
3213namespace detail {
3214// Forward decl
3215template <typename T>
3216struct ConstGraphImpl;
3217
// Read-only accessor set for a node handle of type T, layered on Base<T>.
// Every member function declared here is const; the comment above each one names the
// OrtApi::Node_* entry point it wraps. Only declarations are visible in this listing.
3218template <typename T>
3219struct ConstNodeImpl : Base<T> {
3220 using B = Base<T>;
3221 using B::B;  // inherit Base<T>'s constructors
3222
3223 // <Wraps OrtApi::Node_GetId
3224 size_t GetId() const;
3225 // <Wraps OrtApi::Node_GetName
3226 std::string GetName() const;
3227 // <Wraps OrtApi::Node_GetOperatorType
3228 std::string GetOperatorType() const;
3229 // <Wraps OrtApi::Node_GetDomain
3230 std::string GetDomain() const;
3231 // <Wraps OrtApi::Node_GetSinceVersion
3232 int GetSinceVersion() const;
3233
3234 // <Wraps OrtApi::Node_Inputs
3235 std::vector<ConstValueInfo> GetInputs() const;
3236 // <Wraps OrtApi::Node_Outputs
3237 std::vector<ConstValueInfo> GetOutputs() const;
3238 // <Wraps OrtApi::Node_ImplicitInputs
3239 std::vector<ConstValueInfo> GetImplicitInputs() const;
3240 // <Wraps OrtApi::Node_GetAttributes
3241 std::vector<ConstOpAttr> GetAttributes() const;
3242 // <Wraps OrtApi::Node_GetAttributeByName
3243 // Please, read C API doc for details
// Unlike the other accessors this one reports through a Status return value; `attr` is a
// non-const reference, presumably the output slot for the attribute that was found — confirm
// against the C API documentation referenced above.
3244 Status GetAttributeByName(const std::string& name, ConstOpAttr& attr) const;
3245 // <Wraps OrtApi::Node_GetSubgraphs
3246 std::vector<AttrNameSubgraph> GetSubgraphs() const;
3247 // <Wraps OrtApi::Node_GetGraph
3248 // ConstGraph is not available yet
// NOTE(review): listing line 3249 is absent from this extraction; it presumably holds the
// declaration of the Node_GetGraph wrapper — confirm against the original header.
3250 // <Wraps OrtApi::Node_GetEpName
3251 std::string GetEpName() const;
3252};
3253} // namespace detail
3254
3256
// Node wrapper over OrtNode. It derives from detail::ConstNodeImpl<OrtNode>, so it exposes
// that template's const accessors in addition to the constructors declared here.
3260struct Node : detail::ConstNodeImpl<OrtNode> {
3261 Node() = default; // Same thing as with nullptr
// Builds a wrapper without passing any OrtNode pointer to the base class.
3262 explicit Node(std::nullptr_t) {}
// Wraps an existing OrtNode pointer by forwarding it to the base class.
// NOTE(review): ownership of `p` is not stated in this listing — confirm before relying on it.
3263 explicit Node(OrtNode* p) : ConstNodeImpl<OrtNode>{p} {}
3264
// The constructors below are compiled only when ORT_MINIMAL_BUILD is not defined.
3265#if !defined(ORT_MINIMAL_BUILD)
// Constructs a node from its operator name and domain, the node name, and the names of its
// inputs and outputs. This overload takes no attributes.
3266 Node(const std::string& operator_name, const std::string& operator_domain,
3267 const std::string& node_name,
3268 const std::vector<std::string>& input_names,
3269 const std::vector<std::string>& output_names);
3270
// Same as the overload above, plus a list of attributes.
// NOTE(review): `attributes` is taken by non-const reference, so the implementation may modify
// or take over its elements; the documentation lines for this overload (listing 3271-3273) are
// absent here — confirm against the original header.
3274 Node(const std::string& operator_name, const std::string& operator_domain,
3275 const std::string& node_name,
3276 const std::vector<std::string>& input_names,
3277 const std::vector<std::string>& output_names,
3278 std::vector<OpAttr>& attributes);
3279
3280 private:
// Static helper taking the same arguments as the attribute-carrying constructor plus an
// OrtNode*& `node`; presumably shared by both constructors and writes the created node into
// `node` — the definition is not in this listing.
3281 static void Init(const std::string& operator_name, const std::string& operator_domain,
3282 const std::string& node_name,
3283 const std::vector<std::string>& input_names,
3284 const std::vector<std::string>& output_names,
3285 std::vector<OpAttr>& attributes,
3286 OrtNode*& node);
3287#endif // !defined(ORT_MINIMAL_BUILD)
3288};
3289
3290// Return struct for some of ValueInfo APIs.
3291// Must be declared after ConstNode is available.
3294 // either producer output or consumer output index
3295 // producer is unsigned only, output can be -1
3296 int64_t index;
3297};
3298
3299// Represents a return value for Graph::GetOperatorSets()
3301 std::string domain;
3302 int64_t version;
3303};
3304
3305namespace detail {
3306template <typename T>
3308 using B = Base<T>;
3309 using B::B;
3310
3311 // <Wraps OrtApi::Graph_GetName
3312 std::string GetName() const;
3313 // <Wraps OrtApi::Graph_GetModelPath
3314 std::basic_string<ORTCHAR_T> GetModelPath() const;
3315 // <Wraps OrtApi::Graph_GetOnnxIRVersion
3316 int64_t GetOnnxIRVersion() const;
3317 // <Wraps OrtApi::Graph_GetOperatorSets
3318 std::vector<OperatorSet> GetOperatorSets() const;
3319 // <Wraps OrtApi::Graph_Inputs
3320 std::vector<ConstValueInfo> GetInputs() const;
3321 // <Wraps OrtApi::Graph_Outputs
3322 std::vector<ConstValueInfo> GetOutputs() const;
3323 // <Wraps OrtApi::Graph_Initializers
3324 std::vector<ConstValueInfo> GetInitializers() const;
3325 // <Wraps OrtApi::Graph_GetNodes
3326 std::vector<ConstNode> GetNodes() const;
3327 // <Wraps OrtApi::Graph_GetParentGraph
3329 // <Wraps OrtApi::Graph_GetGraphView
3330 Graph GetGraphView(const std::vector<ConstNode>& nodes) const;
3331 // <Wraps OrtApi::Graph_GetModelMetadata
3333};
3334
3335template <typename T>
3338 using B::B;
3339
3340#if !defined(ORT_MINIMAL_BUILD)
3341 // <Wraps GetModelEditorApi().SetGraphInputs()
3342 void SetInputs(std::vector<ValueInfo>& inputs);
3343 // <Wraps GetModelEditorApi().SetGraphOutputs()
3344 void SetOutputs(std::vector<ValueInfo>& outputs);
3345 // <Wraps GetModelEditorApi().AddInitializerToGraph()
3346 void AddInitializer(const std::string& name, Value& initializer, bool data_is_external); // Graph takes ownership of Value
3347 // <Wraps GetModelEditorApi().AddNodeToGraph()
3348 void AddNode(Node& node); // Graph takes ownership of Node
3349#endif // !defined(ORT_MINIMAL_BUILD)
3350};
3351} // namespace detail
3352
3354
3355// Return value for Node API
3356// Must be declared after ConstGraph
3361
// Wrapper around OrtGraph, built on detail::GraphImpl<OrtGraph>.
3365struct Graph : detail::GraphImpl<OrtGraph> {
// No instance is created; the wrapper holds no OrtGraph.
3366 explicit Graph(std::nullptr_t) {}
// Takes ownership of a pointer created by the C API.
3367 explicit Graph(OrtGraph* p) : GraphImpl<OrtGraph>{p} {}
3368#if !defined(ORT_MINIMAL_BUILD)
3369 // <Wraps GetModelEditorApi().CreateGraph()
// NOTE(review): the declaration this comment refers to (listing line 3370) is absent from this
// extraction — confirm against the original header.
3371#endif
3372};
3373
3374namespace detail {
3375template <typename T>
3378 using B::B;
3379
3380#if !defined(ORT_MINIMAL_BUILD)
3381 // <Wraps GetModelEditorApi().AddGraphToModel()
3382 void AddGraph(Graph& graph);
3383#endif
3384};
3385} // namespace detail
3386
3387// Const object holder that does not own the underlying object
3389
// Wrapper over OrtModel, built on detail::ModelImpl<OrtModel>.
3393struct Model : detail::ModelImpl<OrtModel> {
// Pairs a std::string with an int; going by the alias name, an operator-set domain and its
// opset version.
3394 using DomainOpsetPair = std::pair<std::string, int>;
3395
// Builds a wrapper without passing any OrtModel pointer to the base class.
3396 explicit Model(std::nullptr_t) {}
// Wraps an existing OrtModel pointer by forwarding it to the base class.
3397 explicit Model(OrtModel* p) : ModelImpl<OrtModel>{p} {}
3398
// Available only when ORT_MINIMAL_BUILD is not defined.
3399#if !defined(ORT_MINIMAL_BUILD)
3400 //< Wraps GetModelEditorApi().CreateModel()
3401 explicit Model(const std::vector<DomainOpsetPair>& opsets);
3402#endif
3403};
3404
3405namespace detail {
3406template <typename T>
3408 using B = Base<T>;
3409 using B::B;
3410
3412 const char* GetOperatorType() const;
3413
3415 const char* GetDomain() const;
3416
3418 std::pair<int, int> GetSinceVersion() const;
3419
3421 const char* GetExecutionProvider() const;
3422
3424 OrtMemType GetInputMemType(size_t input_index) const;
3425
3427 OrtMemType GetOutputMemType(size_t output_index) const;
3428};
3429} // namespace detail
3430
3432
3435 using Base::Base;
3436
3437 explicit KernelDef(std::nullptr_t) {}
3438 explicit KernelDef(OrtKernelDef* p) : detail::ConstKernelDefImpl<OrtKernelDef>{p} {}
3439
3440 ConstKernelDef GetConst() const { return ConstKernelDef{this->p_}; }
3441};
3442
// Builder for OrtKernelDef, wrapping an OrtKernelDefBuilder handle.
// Every Set*/Add* member returns KernelDefBuilder&, which allows calls to be chained
// (presumably each returns *this — the definitions are not in this listing).
// NOTE(review): listing lines 3448, 3455 and 3467 are absent from this extraction, so some
// members of the original struct are not shown here.
3447struct KernelDefBuilder : detail::Base<OrtKernelDefBuilder> {
// Creates an empty object; it must be assigned a valid one before use.
3449 explicit KernelDefBuilder(std::nullptr_t) {}
// Wraps an existing OrtKernelDefBuilder pointer (defined out of line).
3450 explicit KernelDefBuilder(OrtKernelDefBuilder* ort_kernel_def_builder);
3451
3452 KernelDefBuilder& SetOperatorType(const char* op_type);
3453 KernelDefBuilder& SetDomain(const char* domain);
3454 KernelDefBuilder& SetSinceVersion(int since_version_start, int since_version_end);
3456 KernelDefBuilder& SetInputMemType(size_t input_index, OrtMemType mem_type);
3457 KernelDefBuilder& SetOutputMemType(size_t output_index, OrtMemType mem_type);
// AddTypeConstraint has two overloads: a single data type, or a vector of data types.
3458 KernelDefBuilder& AddTypeConstraint(const char* arg_name, const OrtDataType* data_type);
3459 KernelDefBuilder& AddTypeConstraint(const char* arg_name, const std::vector<const OrtDataType*>& data_types);
// The alias members come in single-pair and vector forms; the vector forms take parallel
// lists of input and output indices.
3460 KernelDefBuilder& AddInputOutputAlias(int input_index, int output_index);
3461 KernelDefBuilder& AddInputOutputAliases(const std::vector<int>& input_indices,
3462 const std::vector<int>& output_indices);
3463 KernelDefBuilder& AddInputOutputMutableAlias(int input_index, int output_index);
3464 KernelDefBuilder& AddInputOutputMutableAliases(const std::vector<int>& input_indices,
3465 const std::vector<int>& output_indices);
3466
3468};
3469
// Wrapper over an OrtKernelRegistry handle.
// NOTE(review): listing lines 3475-3476 and the documentation lines between the members are
// absent from this extraction — confirm the full interface against the original header.
3474struct KernelRegistry : detail::Base<OrtKernelRegistry> {
3477
// Builds a wrapper without passing any OrtKernelRegistry pointer to the base class.
3479 explicit KernelRegistry(std::nullptr_t) {}
3480
// Wraps an existing OrtKernelRegistry pointer (defined out of line).
3482 explicit KernelRegistry(OrtKernelRegistry* ort_kernel_registry);
3483
// Takes a kernel definition, the function used to create the kernel, and an opaque state
// pointer for that function; the outcome is reported through the returned Status.
// Presumably this registers the kernel with the wrapped registry — definition not shown here.
3485 Status AddKernel(const OrtKernelDef* kernel_def, OrtKernelCreateFunc kernel_create_func,
3486 void* kernel_create_func_state);
3487};
3488
3489namespace detail {
3490template <typename T>
3493 using B::B;
3494
3495 //< Wraps SharedPrePackedWeightCache_StoreWeightData
3496 Status StoreWeightData(void** buffer_data_ptrs, size_t* buffer_sizes, size_t num_buffers);
3497};
3498} // namespace detail
3499
3517
3520} // namespace Ort
3521#include "onnxruntime_cxx_inline.h"
struct OrtMemoryInfo OrtMemoryInfo
Definition onnxruntime_c_api.h:299
struct OrtKernelInfo OrtKernelInfo
Definition onnxruntime_c_api.h:459
struct OrtNode OrtNode
Definition onnxruntime_c_api.h:327
OrtLoggingLevel
Logging severity levels.
Definition onnxruntime_c_api.h:249
OrtMemoryInfoDeviceType
This mimics OrtDevice type constants so they can be returned in the API.
Definition onnxruntime_c_api.h:494
struct OrtShapeInferContext OrtShapeInferContext
Definition onnxruntime_c_api.h:324
void(* OrtLoggingFunction)(void *param, OrtLoggingLevel severity, const char *category, const char *logid, const char *code_location, const char *message)
Definition onnxruntime_c_api.h:423
void(* OrtCustomJoinThreadFn)(OrtCustomThreadHandle ort_custom_thread_handle)
Custom thread join function.
Definition onnxruntime_c_api.h:960
OrtCustomOpInputOutputCharacteristic
Definition onnxruntime_c_api.h:7215
struct OrtTensorRTProviderOptionsV2 OrtTensorRTProviderOptionsV2
Definition onnxruntime_c_api.h:316
struct OrtThreadingOptions OrtThreadingOptions
Definition onnxruntime_c_api.h:313
struct OrtSequenceTypeInfo OrtSequenceTypeInfo
Definition onnxruntime_c_api.h:307
struct OrtValueInfo OrtValueInfo
Definition onnxruntime_c_api.h:326
struct OrtDnnlProviderOptions OrtDnnlProviderOptions
Definition onnxruntime_c_api.h:320
OrtSparseIndicesFormat
Definition onnxruntime_c_api.h:238
struct OrtPrepackedWeightsContainer OrtPrepackedWeightsContainer
Definition onnxruntime_c_api.h:315
struct OrtSession OrtSession
Definition onnxruntime_c_api.h:301
OrtCompiledModelCompatibility
Definition onnxruntime_c_api.h:1043
OrtStatus *(* EpSelectionDelegate)(const OrtEpDevice **ep_devices, size_t num_devices, const OrtKeyValuePairs *model_metadata, const OrtKeyValuePairs *runtime_metadata, const OrtEpDevice **selected, size_t max_selected, size_t *num_selected, void *state)
Delegate to allow providing custom OrtEpDevice selection logic.
Definition onnxruntime_c_api.h:548
struct OrtCustomOpDomain OrtCustomOpDomain
Definition onnxruntime_c_api.h:310
struct OrtIoBinding OrtIoBinding
Definition onnxruntime_c_api.h:300
struct OrtExternalInitializerInfo OrtExternalInitializerInfo
Definition onnxruntime_c_api.h:335
OrtAllocatorType
Definition onnxruntime_c_api.h:465
struct OrtOp OrtOp
Definition onnxruntime_c_api.h:321
struct OrtTypeInfo OrtTypeInfo
Definition onnxruntime_c_api.h:304
struct OrtTensorTypeAndShapeInfo OrtTensorTypeAndShapeInfo
Definition onnxruntime_c_api.h:305
struct OrtCUDAProviderOptionsV2 OrtCUDAProviderOptionsV2
Definition onnxruntime_c_api.h:318
struct OrtKernelContext OrtKernelContext
Definition onnxruntime_c_api.h:461
struct OrtCANNProviderOptions OrtCANNProviderOptions
Definition onnxruntime_c_api.h:319
struct OrtEpDevice OrtEpDevice
Definition onnxruntime_c_api.h:332
void(* RunAsyncCallbackFn)(void *user_data, OrtValue **outputs, size_t num_outputs, OrtStatusPtr status)
Callback function for RunAsync.
Definition onnxruntime_c_api.h:971
OrtHardwareDeviceType
Definition onnxruntime_c_api.h:501
struct OrtModel OrtModel
Definition onnxruntime_c_api.h:329
struct OrtGraph OrtGraph
Definition onnxruntime_c_api.h:328
struct OrtSyncStream OrtSyncStream
Definition onnxruntime_c_api.h:334
struct OrtSessionOptions OrtSessionOptions
Definition onnxruntime_c_api.h:309
OrtDeviceMemoryType
This matches OrtDevice::MemoryType values.
Definition onnxruntime_c_api.h:487
struct OrtValue OrtValue
Definition onnxruntime_c_api.h:302
OrtStatus *(* OrtWriteBufferFunc)(void *state, const void *buffer, size_t buffer_num_bytes)
Function called by ORT to write a buffer to a custom destination (e.g., file, stream,...
Definition onnxruntime_c_api.h:567
GraphOptimizationLevel
Graph optimization level.
Definition onnxruntime_c_api.h:432
struct OrtKeyValuePairs OrtKeyValuePairs
Definition onnxruntime_c_api.h:333
OrtStatus * OrtStatusPtr
Definition onnxruntime_c_api.h:346
OrtMemType
Memory types for allocated memory, execution provider specific types should be extended in each provi...
Definition onnxruntime_c_api.h:475
OrtSparseFormat
Definition onnxruntime_c_api.h:230
ONNXType
Definition onnxruntime_c_api.h:218
struct OrtEnv OrtEnv
Definition onnxruntime_c_api.h:297
OrtErrorCode
Definition onnxruntime_c_api.h:257
struct OrtStatus OrtStatus
Definition onnxruntime_c_api.h:298
OrtStatus *(* OrtGetInitializerLocationFunc)(void *state, const char *initializer_name, const OrtValue *initializer_value, const OrtExternalInitializerInfo *external_info, OrtExternalInitializerInfo **new_external_info)
Function called by ORT to allow user to specify how an initializer should be saved,...
Definition onnxruntime_c_api.h:601
#define ORT_API_VERSION
The API version defined in this header.
Definition onnxruntime_c_api.h:41
struct OrtLogger OrtLogger
Definition onnxruntime_c_api.h:323
struct OrtMapTypeInfo OrtMapTypeInfo
Definition onnxruntime_c_api.h:306
struct OrtArenaCfg OrtArenaCfg
Definition onnxruntime_c_api.h:314
ExecutionMode
Definition onnxruntime_c_api.h:440
OrtOpAttrType
Definition onnxruntime_c_api.h:275
OrtCustomThreadHandle(* OrtCustomCreateThreadFn)(void *ort_custom_thread_creation_options, OrtThreadWorkerFn ort_thread_worker_fn, void *ort_worker_fn_param)
Ort custom thread creation function.
Definition onnxruntime_c_api.h:953
ONNXTensorElementDataType
Definition onnxruntime_c_api.h:184
OrtExecutionProviderDevicePolicy
These are the default EP selection policies used by ORT when doing automatic EP selection.
Definition onnxruntime_c_api.h:509
const OrtApiBase * OrtGetApiBase(void)
The Onnxruntime library's entry point to access the C API.
@ ORT_LOGGING_LEVEL_WARNING
Warning messages.
Definition onnxruntime_c_api.h:252
@ OrtMemTypeDefault
The default allocator for execution provider.
Definition onnxruntime_c_api.h:483
@ ORT_FAIL
Definition onnxruntime_c_api.h:259
@ ONNX_TENSOR_ELEMENT_DATA_TYPE_FLOAT
Definition onnxruntime_c_api.h:186
std::vector< Value > GetOutputValuesHelper(const OrtIoBinding *binding, OrtAllocator *)
std::vector< std::string > GetOutputNamesHelper(const OrtIoBinding *binding, OrtAllocator *)
void OrtRelease(OrtAllocator *ptr)
Definition onnxruntime_cxx_api.h:629
std::string MakeCustomOpConfigEntryKey(const char *custom_op_name, const char *config)
All C++ Onnxruntime APIs are defined inside this namespace.
Definition onnxruntime_cxx_api.h:48
Ort::KeyValuePairs GetEnvConfigEntries()
const OrtModelEditorApi & GetModelEditorApi()
This returns a reference to the ORT C Model Editor API. Used if building or augmenting a model at run...
Definition onnxruntime_cxx_api.h:215
std::unique_ptr< char, detail::AllocatedFree > AllocatedStringPtr
unique_ptr typedef used to own strings allocated by OrtAllocators and release them at the end of the ...
Definition onnxruntime_cxx_api.h:805
detail::ConstSessionOptionsImpl< detail::Unowned< const OrtSessionOptions > > ConstSessionOptions
Definition onnxruntime_cxx_api.h:1552
detail::KernelInfoImpl< detail::Unowned< const OrtKernelInfo > > ConstKernelInfo
Definition onnxruntime_cxx_api.h:2892
const OrtApi & GetApi() noexcept
This returns a reference to the ORT C API.
Definition onnxruntime_cxx_api.h:189
const OrtCompileApi & GetCompileApi()
This returns a reference to the ORT C Compile API. Used if compiling a model at runtime.
Definition onnxruntime_cxx_api.h:229
AllocatedStringPtr GetCompatibilityInfoFromModelAllocated(const char *model_path, const char *ep_type, OrtAllocator *allocator)
Extract EP compatibility info from a precompiled model file.
AllocatedStringPtr GetCompatibilityInfoFromModelBytesAllocated(const void *model_data, size_t model_data_length, const char *ep_type, OrtAllocator *allocator)
Extract EP compatibility info from precompiled model bytes in memory.
detail::AllocatorImpl< detail::Unowned< OrtAllocator > > UnownedAllocator
Definition onnxruntime_cxx_api.h:1081
OrtCompiledModelCompatibility GetModelCompatibilityForEpDevices(const std::vector< ConstEpDevice > &ep_devices, const char *compatibility_info)
Validate a compiled model's compatibility for one or more EP devices.
const OrtInteropApi & GetInteropApi()
This returns a reference to the ORT C Interop API. Used for external resource import with EPs.
Definition onnxruntime_cxx_api.h:243
detail::SessionOptionsImpl< detail::Unowned< OrtSessionOptions > > UnownedSessionOptions
Definition onnxruntime_cxx_api.h:1551
std::string GetBuildInfoString()
This function returns the onnxruntime build information: including git branch, git commit id,...
const OrtEpApi & GetEpApi()
This returns a reference to the ORT C EP API. Used if authoring a plugin execution provider.
Definition onnxruntime_cxx_api.h:257
std::string GetVersionString()
This function returns the onnxruntime version string.
std::vector< std::string > GetAvailableProviders()
This is a C++ wrapper for OrtApi::GetAvailableProviders() and returns a vector of strings representin...
Ort::Status(*)(Ort::ShapeInferContext &) ShapeInferFn
Definition onnxruntime_cxx_api.h:3011
Status CompileModel(const Env &env, const ModelCompilationOptions &model_compilation_options)
Compiles an input model to generate a model with EPContext nodes that execute EP-specific kernels....
Wrapper around OrtAllocator.
Definition onnxruntime_cxx_api.h:1073
Allocator(const Session &session, const OrtMemoryInfo *)
Take ownership of a pointer created by C API.
Allocator(std::nullptr_t)
Convenience to create a class member and then replace with an instance.
Definition onnxruntime_cxx_api.h:1074
Allocator(OrtAllocator *p)
Definition onnxruntime_cxx_api.h:1078
Wrapper around OrtAllocator default instance that is owned by Onnxruntime.
Definition onnxruntime_cxx_api.h:1064
AllocatorWithDefaultOptions(std::nullptr_t)
Convenience to create a class member and then replace with an instance.
Definition onnxruntime_cxx_api.h:1065
it is a structure that represents the configuration of an arena based allocator
Definition onnxruntime_cxx_api.h:2590
ArenaCfg(std::nullptr_t)
Create an empty ArenaCfg object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:2591
ArenaCfg(const std::unordered_map< std::string, size_t > &arena_config)
ArenaCfg(size_t max_mem, int arena_extend_strategy, int initial_chunk_size_bytes, int max_dead_bytes_per_chunk)
Definition onnxruntime_cxx_api.h:3357
ConstGraph sub_graph
Definition onnxruntime_cxx_api.h:3359
std::string attr_name
Definition onnxruntime_cxx_api.h:3358
bfloat16 (Brain Floating Point) data type
Definition onnxruntime_cxx_api.h:427
bool operator==(const BFloat16_t &rhs) const noexcept
onnxruntime_float16::BFloat16Impl< BFloat16_t > Base
Definition onnxruntime_cxx_api.h:439
BFloat16_t()=default
static constexpr BFloat16_t FromBits(uint16_t v) noexcept
Explicit conversion to uint16_t representation of bfloat16.
Definition onnxruntime_cxx_api.h:448
bool operator!=(const BFloat16_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:546
BFloat16_t(float v) noexcept
__ctor from float. Float is converted into bfloat16 16-bit representation.
Definition onnxruntime_cxx_api.h:454
float ToFloat() const noexcept
Converts bfloat16 to float.
Definition onnxruntime_cxx_api.h:460
bool operator<(const BFloat16_t &rhs) const noexcept
The CUDAProviderOptions (V2)
Definition onnxruntime_cxx_api.h:876
CUDAProviderOptions()
Wraps OrtApi::CreateCUDAProviderOptions.
CUDAProviderOptions(std::nullptr_t)
Definition onnxruntime_cxx_api.h:877
void UpdateWithValue(const char *key, void *value)
Wrapper around OrtApi::UpdateCUDAProviderOptionsWithValue.
std::string GetCUDAProviderOptionsAsString() const
Wrapper around OrtApi::GetCUDAProviderOptionsAsString.
void Update(const std::unordered_map< std::string, std::string > &options)
Wrapper around OrtApi::UpdateCUDAProviderOptions.
void * GetOptionByName(const char *name) const
Wrapper around OrtApi::GetCUDAProviderOptionsByName.
Definition onnxruntime_cxx_api.h:3016
OrtCustomOpInputOutputCharacteristic GetOutputCharacteristic(size_t) const
Definition onnxruntime_cxx_api.h:3091
OrtCustomOpInputOutputCharacteristic GetInputCharacteristic(size_t) const
Definition onnxruntime_cxx_api.h:3087
OrtMemType GetInputMemoryType(size_t) const
Definition onnxruntime_cxx_api.h:3096
std::vector< std::string > GetSessionConfigKeys() const
Definition onnxruntime_cxx_api.h:3127
bool GetVariadicInputHomogeneity() const
Definition onnxruntime_cxx_api.h:3108
int GetVariadicInputMinArity() const
Definition onnxruntime_cxx_api.h:3102
void SetShapeInferFn(...)
Definition onnxruntime_cxx_api.h:3144
CustomOpBase()
Definition onnxruntime_cxx_api.h:3017
bool GetVariadicOutputHomogeneity() const
Definition onnxruntime_cxx_api.h:3120
int GetVariadicOutputMinArity() const
Definition onnxruntime_cxx_api.h:3114
decltype(&C::InferOutputShape) SetShapeInferFn(decltype(&C::InferOutputShape))
Definition onnxruntime_cxx_api.h:3135
const char * GetExecutionProviderType() const
Definition onnxruntime_cxx_api.h:3083
void GetSessionConfigs(std::unordered_map< std::string, std::string > &out, ConstSessionOptions options) const
Class that represents session configuration entries for one or more custom operators.
Definition onnxruntime_cxx_api.h:1402
~CustomOpConfigs()=default
CustomOpConfigs & AddConfig(const char *custom_op_name, const char *config_key, const char *config_value)
Adds a session configuration entry/value for a specific custom operator.
CustomOpConfigs & operator=(CustomOpConfigs &&o)=default
CustomOpConfigs(CustomOpConfigs &&o)=default
CustomOpConfigs()=default
const std::unordered_map< std::string, std::string > & GetFlattenedConfigs() const
Returns a flattened map of custom operator configuration entries and their values.
CustomOpConfigs(const CustomOpConfigs &)=default
CustomOpConfigs & operator=(const CustomOpConfigs &)=default
Custom Op Domain.
Definition onnxruntime_cxx_api.h:1298
CustomOpDomain(std::nullptr_t)
Create an empty CustomOpDomain object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1302
CustomOpDomain(const char *domain)
Wraps OrtApi::CreateCustomOpDomain.
void Add(const OrtCustomOp *op)
Wraps CustomOpDomain_Add.
The Env (Environment)
Definition onnxruntime_cxx_api.h:1238
Env & EnableTelemetryEvents()
Wraps OrtApi::EnableTelemetryEvents.
Env(OrtEnv *p)
C Interop Helper.
Definition onnxruntime_cxx_api.h:1258
Env & CreateAndRegisterAllocatorV2(const std::string &provider_type, const OrtMemoryInfo *mem_info, const std::unordered_map< std::string, std::string > &options, const OrtArenaCfg *arena_cfg)
Wraps OrtApi::CreateAndRegisterAllocatorV2.
Env & UnregisterExecutionProviderLibrary(const char *registration_name)
Wraps OrtApi::UnregisterExecutionProviderLibrary.
std::vector< ConstEpDevice > GetEpDevices() const
Env & UnregisterAllocator(const OrtMemoryInfo *mem_info)
Wraps OrtApi::UnregisterAllocator.
Env(std::nullptr_t)
Create an empty Env object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1239
Env(OrtLoggingLevel logging_level=ORT_LOGGING_LEVEL_WARNING, const char *logid="")
Wraps OrtApi::CreateEnv.
Env(const OrtThreadingOptions *tp_options, OrtLoggingLevel logging_level=ORT_LOGGING_LEVEL_WARNING, const char *logid="")
Wraps OrtApi::CreateEnvWithGlobalThreadPools.
Env(const OrtThreadingOptions *tp_options, OrtLoggingFunction logging_function, void *logger_param, OrtLoggingLevel logging_level=ORT_LOGGING_LEVEL_WARNING, const char *logid="")
Wraps OrtApi::CreateEnvWithCustomLoggerAndGlobalThreadPools.
Env & RegisterAllocator(OrtAllocator *allocator)
Wraps OrtApi::RegisterAllocator.
UnownedAllocator CreateSharedAllocator(const OrtEpDevice *ep_device, OrtDeviceMemoryType mem_type, OrtAllocatorType allocator_type, const OrtKeyValuePairs *allocator_options)
Wraps OrtApi::CreateSharedAllocator.
Env(OrtLoggingLevel logging_level, const char *logid, OrtLoggingFunction logging_function, void *logger_param)
Wraps OrtApi::CreateEnvWithCustomLogger.
Env(const OrtEnvCreationOptions *options)
Wraps OrtApi::CreateEnvWithOptions.
Env & CreateAndRegisterAllocator(const OrtMemoryInfo *mem_info, const OrtArenaCfg *arena_cfg)
Wraps OrtApi::CreateAndRegisterAllocator.
UnownedAllocator GetSharedAllocator(const OrtMemoryInfo *mem_info)
Wraps OrtApi::GetSharedAllocator.
Env & RegisterExecutionProviderLibrary(const char *registration_name, const std::basic_string< char > &path)
Wraps OrtApi::RegisterExecutionProviderLibrary.
Env & UpdateEnvWithCustomLogLevel(OrtLoggingLevel log_severity_level)
Wraps OrtApi::UpdateEnvWithCustomLogLevel.
Status CopyTensors(const std::vector< Value > &src_tensors, const std::vector< Value > &dst_tensors, OrtSyncStream *stream) const
Wraps OrtApi::CopyTensors.
void ReleaseSharedAllocator(const OrtEpDevice *ep_device, OrtDeviceMemoryType mem_type)
Wraps OrtApi::ReleaseSharedAllocator.
Env & DisableTelemetryEvents()
Wraps OrtApi::DisableTelemetryEvents.
Mutable EpDevice that is created by EpApi users.
Definition onnxruntime_cxx_api.h:1148
EpDevice(OrtEpDevice *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:1150
EpDevice(OrtEpFactory &ep_factory, ConstHardwareDevice &hardware_device, ConstKeyValuePairs ep_metadata={}, ConstKeyValuePairs ep_options={})
Wraps OrtEpApi::CreateEpDevice.
EpDevice(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:1149
All C++ methods that can fail will throw an exception of this type.
Definition onnxruntime_cxx_api.h:54
const char * what() const noexcept override
Definition onnxruntime_cxx_api.h:59
Exception(const std::string &string, OrtErrorCode code)
Definition onnxruntime_cxx_api.h:55
OrtErrorCode GetOrtErrorCode() const
Definition onnxruntime_cxx_api.h:58
Exception(std::string &&string, OrtErrorCode code)
Definition onnxruntime_cxx_api.h:56
Wrapper around OrtExternalInitializerInfo.
Definition onnxruntime_cxx_api.h:927
ConstExternalInitializerInfo GetConst() const
Definition onnxruntime_cxx_api.h:935
ExternalInitializerInfo(const char *filepath, int64_t file_offset, size_t byte_size)
Wraps OrtApi::CreateExternalInitializerInfo.
ExternalInitializerInfo(std::nullptr_t)
Definition onnxruntime_cxx_api.h:931
ExternalInitializerInfo(OrtExternalInitializerInfo *p)
Definition onnxruntime_cxx_api.h:932
static Status Create(const char *filepath, int64_t file_offset, size_t byte_size, ExternalInitializerInfo &out)
Wrapper around CreateExternalInitializerInfo that does not throw an exception.
IEEE 754 half-precision floating point data type.
Definition onnxruntime_cxx_api.h:285
Float16_t()=default
Default constructor.
Float16_t(float v) noexcept
__ctor from float. Float is converted into float16 16-bit representation.
Definition onnxruntime_cxx_api.h:313
onnxruntime_float16::Float16Impl< Float16_t > Base
Definition onnxruntime_cxx_api.h:295
float ToFloat() const noexcept
Converts float16 to float.
Definition onnxruntime_cxx_api.h:319
static constexpr Float16_t FromBits(uint16_t v) noexcept
Explicit conversion to uint16_t representation of float16.
Definition onnxruntime_cxx_api.h:307
float8e4m3fn (Float8 Floating Point) data type
Definition onnxruntime_cxx_api.h:557
uint8_t value
Definition onnxruntime_cxx_api.h:558
constexpr Float8E4M3FN_t(uint8_t v) noexcept
Definition onnxruntime_cxx_api.h:560
constexpr bool operator==(const Float8E4M3FN_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:563
constexpr Float8E4M3FN_t() noexcept
Definition onnxruntime_cxx_api.h:559
constexpr bool operator!=(const Float8E4M3FN_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:564
float8e4m3fnuz (Float8 Floating Point) data type
Definition onnxruntime_cxx_api.h:574
constexpr bool operator==(const Float8E4M3FNUZ_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:580
uint8_t value
Definition onnxruntime_cxx_api.h:575
constexpr Float8E4M3FNUZ_t() noexcept
Definition onnxruntime_cxx_api.h:576
constexpr bool operator!=(const Float8E4M3FNUZ_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:581
constexpr Float8E4M3FNUZ_t(uint8_t v) noexcept
Definition onnxruntime_cxx_api.h:577
float8e5m2 (Float8 Floating Point) data type
Definition onnxruntime_cxx_api.h:591
constexpr Float8E5M2_t(uint8_t v) noexcept
Definition onnxruntime_cxx_api.h:594
uint8_t value
Definition onnxruntime_cxx_api.h:592
constexpr bool operator!=(const Float8E5M2_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:598
constexpr Float8E5M2_t() noexcept
Definition onnxruntime_cxx_api.h:593
constexpr bool operator==(const Float8E5M2_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:597
float8e5m2fnuz (Float8 Floating Point) data type
Definition onnxruntime_cxx_api.h:608
constexpr Float8E5M2FNUZ_t() noexcept
Definition onnxruntime_cxx_api.h:610
constexpr Float8E5M2FNUZ_t(uint8_t v) noexcept
Definition onnxruntime_cxx_api.h:611
constexpr bool operator!=(const Float8E5M2FNUZ_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:615
constexpr bool operator==(const Float8E5M2FNUZ_t &rhs) const noexcept
Definition onnxruntime_cxx_api.h:614
uint8_t value
Definition onnxruntime_cxx_api.h:609
Wrapper around OrtGraph.
Definition onnxruntime_cxx_api.h:3365
Graph(OrtGraph *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:3367
Graph(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:3366
Wrapper around OrtIoBinding.
Definition onnxruntime_cxx_api.h:2579
UnownedIoBinding GetUnowned() const
Definition onnxruntime_cxx_api.h:2583
ConstIoBinding GetConst() const
Definition onnxruntime_cxx_api.h:2582
IoBinding(Session &session)
IoBinding(std::nullptr_t)
Create an empty object for convenience. Sometimes, we want to initialize members later.
Definition onnxruntime_cxx_api.h:2580
This class wraps a raw pointer OrtKernelContext* that is being passed to the custom kernel Compute() ...
Definition onnxruntime_cxx_api.h:2813
KernelContext(OrtKernelContext *context)
Logger GetLogger() const
ConstValue GetInput(size_t index) const
OrtKernelContext * GetOrtKernelContext() const
Definition onnxruntime_cxx_api.h:2827
void ParallelFor(void(*fn)(void *, size_t), size_t total, size_t num_batch, void *usr_data) const
void * GetGPUComputeStream() const
size_t GetInputCount() const
Ort::Allocator GetAllocator(const OrtMemoryInfo &memory_info) const
size_t GetOutputCount() const
UnownedValue GetOutput(size_t index, const std::vector< int64_t > &dims) const
UnownedValue GetOutput(size_t index, const int64_t *dim_values, size_t dim_count) const
Builder for OrtKernelDef.
Definition onnxruntime_cxx_api.h:3447
KernelDefBuilder & AddTypeConstraint(const char *arg_name, const OrtDataType *data_type)
KernelDefBuilder & SetOutputMemType(size_t output_index, OrtMemType mem_type)
KernelDefBuilder & AddInputOutputMutableAliases(const std::vector< int > &input_indices, const std::vector< int > &output_indices)
KernelDefBuilder & SetInputMemType(size_t input_index, OrtMemType mem_type)
KernelDefBuilder & SetDomain(const char *domain)
KernelDefBuilder & AddInputOutputAliases(const std::vector< int > &input_indices, const std::vector< int > &output_indices)
KernelDefBuilder & AddInputOutputAlias(int input_index, int output_index)
KernelDefBuilder & SetExecutionProvider(const char *ep_name)
KernelDefBuilder & SetOperatorType(const char *op_type)
KernelDefBuilder & AddInputOutputMutableAlias(int input_index, int output_index)
KernelDefBuilder()
Wraps OrtEpApi::CreateKernelDefBuilder.
KernelDefBuilder & AddTypeConstraint(const char *arg_name, const std::vector< const OrtDataType * > &data_types)
KernelDefBuilder(std::nullptr_t)
Create an empty object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:3449
KernelDefBuilder(OrtKernelDefBuilder *ort_kernel_def_builder)
KernelDefBuilder & SetSinceVersion(int since_version_start, int since_version_end)
Definition onnxruntime_cxx_api.h:3433
KernelDef(OrtKernelDef *p)
Definition onnxruntime_cxx_api.h:3438
KernelDef(std::nullptr_t)
Definition onnxruntime_cxx_api.h:3437
ConstKernelDef GetConst() const
Definition onnxruntime_cxx_api.h:3440
This struct owns the OrtKernelInfo* pointer when a copy is made. For convenient wrapping of OrtKernelIn...
Definition onnxruntime_cxx_api.h:2900
KernelInfo(OrtKernelInfo *info)
Take ownership of the instance.
ConstKernelInfo GetConst() const
Definition onnxruntime_cxx_api.h:2905
detail::KernelInfoImpl< OrtKernelInfo > Base
Definition onnxruntime_cxx_api.h:2901
KernelInfo(std::nullptr_t)
Create an empty instance to initialize later.
Definition onnxruntime_cxx_api.h:2903
Registry for kernels supported by an EP.
Definition onnxruntime_cxx_api.h:3474
KernelRegistry()
Wrapper around OrtEpApi::CreateKernelRegistry.
KernelRegistry(std::nullptr_t)
Definition onnxruntime_cxx_api.h:3479
Status AddKernel(const OrtKernelDef *kernel_def, OrtKernelCreateFunc kernel_create_func, void *kernel_create_func_state)
Wraps KernelRegistry_AddKernel.
KernelRegistry(OrtKernelRegistry *ort_kernel_registry)
Take ownership of a pointer created with the C API.
Wrapper around OrtKeyValuePairs.
Definition onnxruntime_cxx_api.h:964
KeyValuePairs()
Wraps OrtApi::CreateKeyValuePairs.
void Add(const char *key, const char *value)
Wraps OrtApi::AddKeyValuePair.
KeyValuePairs(const std::unordered_map< std::string, std::string > &kv_pairs)
Wraps OrtApi::CreateKeyValuePairs and OrtApi::AddKeyValuePair.
void Remove(const char *key)
Wraps OrtApi::RemoveKeyValuePair.
KeyValuePairs(std::nullptr_t)
Definition onnxruntime_cxx_api.h:965
ConstKeyValuePairs GetConst() const
Definition onnxruntime_cxx_api.h:981
KeyValuePairs(OrtKeyValuePairs *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:967
This class represents an ONNX Runtime logger that can be used to log information with an associated s...
Definition onnxruntime_cxx_api.h:2735
Logger(Logger &&v) noexcept=default
Logger & operator=(Logger &&v) noexcept=default
Logger & operator=(const Logger &)=default
~Logger()=default
Logger(const Logger &)=default
Logger()=default
Logger(std::nullptr_t)
Definition onnxruntime_cxx_api.h:2744
Logger(const OrtLogger *logger)
OrtLoggingLevel GetLoggingSeverityLevel() const noexcept
LoraAdapter holds a set of Lora Parameters loaded from a single file.
Definition onnxruntime_cxx_api.h:1312
static LoraAdapter CreateLoraAdapter(const std::basic_string< char > &adapter_path, OrtAllocator *allocator)
Wraps OrtApi::CreateLoraAdapter.
LoraAdapter(std::nullptr_t)
Definition onnxruntime_cxx_api.h:1316
static LoraAdapter CreateLoraAdapterFromArray(const void *bytes, size_t num_bytes, OrtAllocator *allocator)
Wraps OrtApi::CreateLoraAdapterFromArray.
Wrapper around OrtMapTypeInfo.
Definition onnxruntime_cxx_api.h:1978
ConstMapTypeInfo GetConst() const
Definition onnxruntime_cxx_api.h:1984
MapTypeInfo(OrtMapTypeInfo *p)
Used for interop with the C API.
Definition onnxruntime_cxx_api.h:1983
MapTypeInfo(std::nullptr_t)
Create an empty MapTypeInfo object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1982
Represents native memory allocation coming from one of the OrtAllocators registered with OnnxRuntime....
Definition onnxruntime_cxx_api.h:1025
MemoryAllocation(MemoryAllocation &&) noexcept
MemoryAllocation & operator=(const MemoryAllocation &)=delete
MemoryAllocation(const MemoryAllocation &)=delete
MemoryAllocation(OrtAllocator *allocator, void *p, size_t size)
size_t size() const
Definition onnxruntime_cxx_api.h:1034
Wrapper around OrtMemoryInfo.
Definition onnxruntime_cxx_api.h:1009
MemoryInfo(const char *name, OrtAllocatorType type, int id, OrtMemType mem_type)
MemoryInfo(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:1011
MemoryInfo(OrtMemoryInfo *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:1012
static MemoryInfo CreateCpu(OrtAllocatorType type, OrtMemType mem_type1)
ConstMemoryInfo GetConst() const
Definition onnxruntime_cxx_api.h:1016
MemoryInfo(const char *name, OrtMemoryInfoDeviceType device_type, uint32_t vendor_id, uint32_t device_id, OrtDeviceMemoryType mem_type, size_t alignment, OrtAllocatorType allocator_type)
Wrapper around CreateMemoryInfo_V2.
Options object used when compiling a model.
Definition onnxruntime_cxx_api.h:1569
ModelCompilationOptions & SetOutputModelWriteFunc(OrtWriteBufferFunc write_func, void *state)
ModelCompilationOptions & SetEpContextEmbedMode(bool embed_ep_context_in_model)
Wraps OrtApi::ModelCompilationOptions_SetEpContextEmbedMode.
ModelCompilationOptions & SetInputModelFromBuffer(const void *input_model_data, size_t input_model_data_size)
Wraps OrtApi::ModelCompilationOptions_SetInputModelFromBuffer.
ModelCompilationOptions & SetOutputModelBuffer(OrtAllocator *allocator, void **output_model_buffer_ptr, size_t *output_model_buffer_size_ptr)
Wraps OrtApi::ModelCompilationOptions_SetOutputModelBuffer.
ModelCompilationOptions & SetFlags(uint32_t flags)
Wraps OrtApi::ModelCompilationOptions_SetFlags.
ModelCompilationOptions & SetOutputModelExternalInitializersFile(const char *file_path, size_t initializer_size_threshold)
Wraps OrtApi::ModelCompilationOptions_SetOutputModelExternalInitializersFile.
ModelCompilationOptions(std::nullptr_t)
Create an empty ModelCompilationOptions object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1573
ModelCompilationOptions(const Env &env, ConstSessionOptions session_options)
Wraps OrtApi::CreateModelCompilationOptionsFromSessionOptions.
ModelCompilationOptions & SetOutputModelPath(const char *output_model_path)
Wraps OrtApi::ModelCompilationOptions_SetOutputModelPath.
ModelCompilationOptions & SetInputModelPath(const char *input_model_path)
Wraps OrtApi::ModelCompilationOptions_SetInputModelPath.
ModelCompilationOptions & SetOutputModelGetInitializerLocationFunc(OrtGetInitializerLocationFunc get_initializer_location_func, void *state)
ModelCompilationOptions & SetEpContextBinaryInformation(const char *output_directory, const char *model_name)
Wraps OrtApi::ModelCompilationOptions_SetEpContextBinaryInformation.
ModelCompilationOptions & SetGraphOptimizationLevel(GraphOptimizationLevel graph_optimization_level)
Wraps OrtApi::ModelCompilationOptions_SetGraphOptimizationLevel.
ModelCompilationOptions(const Env &env, const SessionOptions &session_options)
Wraps OrtApi::CreateModelCompilationOptionsFromSessionOptions.
Wrapper around OrtModel.
Definition onnxruntime_cxx_api.h:3393
Model(const std::vector< DomainOpsetPair > &opsets)
Model(OrtModel *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:3397
std::pair< std::string, int > DomainOpsetPair
Definition onnxruntime_cxx_api.h:3394
Model(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:3396
Wrapper around OrtModelMetadata.
Definition onnxruntime_cxx_api.h:1615
AllocatedStringPtr GetDescriptionAllocated(OrtAllocator *allocator) const
Returns a copy of the description.
std::vector< AllocatedStringPtr > GetCustomMetadataMapKeysAllocated(OrtAllocator *allocator) const
Returns a vector of copies of the custom metadata keys.
ModelMetadata(std::nullptr_t)
Create an empty ModelMetadata object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1619
AllocatedStringPtr GetGraphDescriptionAllocated(OrtAllocator *allocator) const
Returns a copy of the graph description.
AllocatedStringPtr GetProducerNameAllocated(OrtAllocator *allocator) const
Returns a copy of the producer name.
AllocatedStringPtr GetGraphNameAllocated(OrtAllocator *allocator) const
Returns a copy of the graph name.
AllocatedStringPtr LookupCustomMetadataMapAllocated(const char *key, OrtAllocator *allocator) const
Looks up a value by a key in the Custom Metadata map.
AllocatedStringPtr GetDomainAllocated(OrtAllocator *allocator) const
Returns a copy of the domain name.
int64_t GetVersion() const
Wraps OrtApi::ModelMetadataGetVersion.
Wrapper around OrtNode.
Definition onnxruntime_cxx_api.h:3260
Node(const std::string &operator_name, const std::string &operator_domain, const std::string &node_name, const std::vector< std::string > &input_names, const std::vector< std::string > &output_names)
Node()=default
Node(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:3262
Node(const std::string &operator_name, const std::string &operator_domain, const std::string &node_name, const std::vector< std::string > &input_names, const std::vector< std::string > &output_names, std::vector< OpAttr > &attributes)
Wraps CreateNode. Node takes ownership of attributes on success and updates the OpAttr in attributes ...
Node(OrtNode *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:3263
This struct provides lifetime management for a custom op attribute.
Definition onnxruntime_cxx_api.h:2644
OpAttr(const char *name, const void *data, int len, OrtOpAttrType type)
OpAttr()=default
OpAttr(std::nullptr_t)
Definition onnxruntime_cxx_api.h:2649
ConstOpAttr GetConst() const
Definition onnxruntime_cxx_api.h:2652
Create and own custom defined operation.
Definition onnxruntime_cxx_api.h:2911
Op(OrtOp *)
Take ownership of the OrtOp.
static Op Create(const OrtKernelInfo *info, const char *op_name, const char *domain, int version, const char **type_constraint_names, const ONNXTensorElementDataType *type_constraint_values, size_t type_constraint_count, const OpAttr *attr_values, size_t attr_count, size_t input_count, size_t output_count)
Op(std::nullptr_t)
Create an empty Operator object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:2915
void Invoke(const OrtKernelContext *context, const OrtValue *const *input_values, size_t input_count, OrtValue *const *output_values, size_t output_count)
void Invoke(const OrtKernelContext *context, const Value *input_values, size_t input_count, Value *output_values, size_t output_count)
Definition onnxruntime_cxx_api.h:3300
std::string domain
Definition onnxruntime_cxx_api.h:3301
int64_t version
Definition onnxruntime_cxx_api.h:3302
The PrepackedWeightsContainer.
Definition onnxruntime_cxx_api.h:895
PrepackedWeightsContainer()
Wraps OrtApi::CreatePrepackedWeightsContainer.
PrepackedWeightsContainer(OrtPrepackedWeightsContainer *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:900
PrepackedWeightsContainer(std::nullptr_t)
No instance is created.
Definition onnxruntime_cxx_api.h:898
RunOptions.
Definition onnxruntime_cxx_api.h:1340
int GetRunLogSeverityLevel() const
Wraps OrtApi::RunOptionsGetRunLogSeverityLevel.
RunOptions & SetTerminate()
Terminates all currently executing Session::Run calls that were made using this RunOptions instance.
RunOptions & SetSyncStream(OrtSyncStream *stream)
Associate a sync stream with the run options.
RunOptions & SetRunTag(const char *run_tag)
Wraps OrtApi::RunOptionsSetRunTag.
RunOptions & AddActiveLoraAdapter(const LoraAdapter &adapter)
Add the LoraAdapter to the list of active adapters. The setting does not affect RunWithBinding() call...
RunOptions & UnsetTerminate()
Clears the terminate flag so this RunOptions instance can be used in a new Session::Run call without ...
int GetRunLogVerbosityLevel() const
Wraps OrtApi::RunOptionsGetRunLogVerbosityLevel.
RunOptions(std::nullptr_t)
Create an empty RunOptions object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1341
RunOptions & SetRunLogVerbosityLevel(int)
Wraps OrtApi::RunOptionsSetRunLogVerbosityLevel.
RunOptions & SetRunLogSeverityLevel(int)
Wraps OrtApi::RunOptionsSetRunLogSeverityLevel.
RunOptions & AddConfigEntry(const char *config_key, const char *config_value)
Wraps OrtApi::AddRunConfigEntry.
const char * GetRunTag() const
Wraps OrtApi::RunOptionsGetRunTag.
RunOptions()
Wraps OrtApi::CreateRunOptions.
const char * GetConfigEntry(const char *config_key)
Wraps OrtApi::GetRunConfigEntry.
Wrapper around OrtSequenceTypeInfo.
Definition onnxruntime_cxx_api.h:1940
SequenceTypeInfo(std::nullptr_t)
Create an empty SequenceTypeInfo object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1944
ConstSequenceTypeInfo GetConst() const
Definition onnxruntime_cxx_api.h:1946
SequenceTypeInfo(OrtSequenceTypeInfo *p)
Used for interop with the C API.
Definition onnxruntime_cxx_api.h:1945
Wrapper around OrtSession.
Definition onnxruntime_cxx_api.h:1841
Session(std::nullptr_t)
Create an empty Session object, must be assigned a valid one to be used. Wraps OrtApi::CreateSession.
Definition onnxruntime_cxx_api.h:1843
static Session CreateModelEditorSession(const Env &env, const void *model_data, size_t model_data_length, const SessionOptions &options)
Wraps OrtModelEditorApi::CreateModelEditorSession.
UnownedSession GetUnowned() const
Definition onnxruntime_cxx_api.h:1872
Session(const Env &env, const char *model_path, const SessionOptions &options, OrtPrepackedWeightsContainer *prepacked_weights_container)
Wraps OrtApi::CreateSessionWithPrepackedWeightsContainer.
Session(const Env &env, const void *model_data, size_t model_data_length, const SessionOptions &options, OrtPrepackedWeightsContainer *prepacked_weights_container)
Wraps OrtApi::CreateSessionFromArrayWithPrepackedWeightsContainer.
Session(const Env &env, const Model &model, const SessionOptions &options)
Wraps OrtModelEditorApi::CreateSessionFromModel.
Session(OrtSession *p)
C API Interop.
Definition onnxruntime_cxx_api.h:1844
static Session CreateModelEditorSession(const Env &env, const char *model_path, const SessionOptions &options)
Wraps OrtModelEditorApi::CreateModelEditorSession.
Session(const Env &env, const char *model_path, const SessionOptions &options)
ConstSession GetConst() const
Definition onnxruntime_cxx_api.h:1871
Session(const Env &env, const void *model_data, size_t model_data_length, const SessionOptions &options)
Wraps OrtApi::CreateSessionFromArray.
Wrapper around OrtSessionOptions.
Definition onnxruntime_cxx_api.h:1557
SessionOptions(std::nullptr_t)
Create an empty SessionOptions object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1558
UnownedSessionOptions GetUnowned() const
Definition onnxruntime_cxx_api.h:1561
SessionOptions()
Wraps OrtApi::CreateSessionOptions.
ConstSessionOptions GetConst() const
Definition onnxruntime_cxx_api.h:1562
SessionOptions(OrtSessionOptions *p)
Used for interop with the C API.
Definition onnxruntime_cxx_api.h:1560
Definition onnxruntime_cxx_api.h:2945
SymbolicInteger & operator=(const SymbolicInteger &)=default
SymbolicInteger(const SymbolicInteger &)=default
int64_t AsInt() const
Definition onnxruntime_cxx_api.h:2966
int64_t i_
Definition onnxruntime_cxx_api.h:2973
const char * s_
Definition onnxruntime_cxx_api.h:2974
bool operator==(const SymbolicInteger &dim) const
Definition onnxruntime_cxx_api.h:2954
SymbolicInteger & operator=(SymbolicInteger &&)=default
SymbolicInteger(SymbolicInteger &&)=default
const char * AsSym() const
Definition onnxruntime_cxx_api.h:2967
SymbolicInteger(int64_t i)
Definition onnxruntime_cxx_api.h:2946
SymbolicInteger(const char *s)
Definition onnxruntime_cxx_api.h:2947
bool IsInt() const
Definition onnxruntime_cxx_api.h:2965
Provide access to per-node attributes and input shapes, so one could compute and set output shapes.
Definition onnxruntime_cxx_api.h:2944
Ints GetAttrInts(const char *attr_name)
Strings GetAttrStrings(const char *attr_name)
Status SetOutputShape(size_t indice, const Shape &shape, ONNXTensorElementDataType type=ONNX_TENSOR_ELEMENT_DATA_TYPE_FLOAT)
std::vector< SymbolicInteger > Shape
Definition onnxruntime_cxx_api.h:2979
std::vector< float > Floats
Definition onnxruntime_cxx_api.h:2996
std::string GetAttrString(const char *attr_name)
std::vector< int64_t > Ints
Definition onnxruntime_cxx_api.h:2991
ShapeInferContext(const OrtApi *ort_api, OrtShapeInferContext *ctx)
int64_t GetAttrInt(const char *attr_name)
size_t GetInputCount() const
Definition onnxruntime_cxx_api.h:2985
std::vector< std::string > Strings
Definition onnxruntime_cxx_api.h:3001
Floats GetAttrFloats(const char *attr_name)
const Shape & GetInputShape(size_t indice) const
Definition onnxruntime_cxx_api.h:2983
float GetAttrFloat(const char *attr_name)
The Status that holds ownership of OrtStatus received from C API. Use it to safely destroy OrtStatus* ...
Definition onnxruntime_cxx_api.h:811
OrtErrorCode GetErrorCode() const
Status(const Exception &)
Creates status instance out of exception.
bool IsOK() const noexcept
Returns true if instance represents an OK (non-error) status.
Status(OrtStatus *status) noexcept
Takes ownership of OrtStatus instance returned from the C API.
std::string GetErrorMessage() const
Status()=default
Status(const std::exception &)
Creates status instance out of exception.
Status(const char *message, OrtErrorCode code)
Creates status instance out of null-terminated string message.
Status(std::nullptr_t) noexcept
Create an empty object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:813
Definition onnxruntime_cxx_api.h:1097
SyncStream(OrtSyncStream *p)
Definition onnxruntime_cxx_api.h:1101
SyncStream(std::nullptr_t)
Create an empty SyncStream object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1099
The TensorRTOptions (V2)
Definition onnxruntime_cxx_api.h:857
void Update(const std::unordered_map< std::string, std::string > &options)
Wrapper around OrtApi::UpdateTensorRTProviderOptions.
void UpdateWithValue(const char *key, void *value)
Wrapper around OrtApi::UpdateTensorRTProviderOptionsWithValue.
std::string GetTensorRTProviderOptionsAsString() const
Wrapper around OrtApi::GetTensorRTProviderOptionsAsString.
void * GetOptionByName(const char *name) const
Wrapper around OrtApi::GetTensorRTProviderOptionsByName.
TensorRTProviderOptions(std::nullptr_t)
Definition onnxruntime_cxx_api.h:858
TensorRTProviderOptions()
Wraps OrtApi::CreateTensorRTProviderOptionsV2.
Wrapper around OrtTensorTypeAndShapeInfo.
Definition onnxruntime_cxx_api.h:1906
TensorTypeAndShapeInfo(std::nullptr_t)
Create an empty TensorTypeAndShapeInfo object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:1911
ConstTensorTypeAndShapeInfo GetConst() const
Definition onnxruntime_cxx_api.h:1922
TensorTypeAndShapeInfo(OrtTensorTypeAndShapeInfo *p)
Used for interop with the C API.
Definition onnxruntime_cxx_api.h:1913
TensorTypeAndShapeInfo(ONNXTensorElementDataType element_type, const std::vector< int64_t > &dims, const std::vector< std::string > *symbolic_dims=nullptr)
The ThreadingOptions.
Definition onnxruntime_cxx_api.h:827
ThreadingOptions & SetGlobalCustomThreadCreationOptions(void *ort_custom_thread_creation_options)
Wraps OrtApi::SetGlobalCustomThreadCreationOptions.
ThreadingOptions()
Wraps OrtApi::CreateThreadingOptions.
ThreadingOptions & SetGlobalInterOpNumThreads(int inter_op_num_threads)
Wraps OrtApi::SetGlobalInterOpNumThreads.
ThreadingOptions & SetGlobalCustomCreateThreadFn(OrtCustomCreateThreadFn ort_custom_create_thread_fn)
Wraps OrtApi::SetGlobalCustomCreateThreadFn.
ThreadingOptions & SetGlobalCustomJoinThreadFn(OrtCustomJoinThreadFn ort_custom_join_thread_fn)
Wraps OrtApi::SetGlobalCustomJoinThreadFn.
ThreadingOptions & SetGlobalSpinControl(int allow_spinning)
Wraps OrtApi::SetGlobalSpinControl.
ThreadingOptions & SetGlobalDenormalAsZero()
Wraps OrtApi::SetGlobalDenormalAsZero.
ThreadingOptions & SetGlobalIntraOpNumThreads(int intra_op_num_threads)
Wraps OrtApi::SetGlobalIntraOpNumThreads.
Type information that may contain either TensorTypeAndShapeInfo or the information about contained se...
Definition onnxruntime_cxx_api.h:2012
static TypeInfo CreateOptionalTypeInfo(ConstTypeInfo contained_type)
static TypeInfo CreateSequenceTypeInfo(ConstTypeInfo sequence_type)
static TypeInfo CreateTensorInfo(ConstTensorTypeAndShapeInfo tensor_info)
static TypeInfo CreateSparseTensorInfo(ConstTensorTypeAndShapeInfo sparse_tensor_info)
TypeInfo(std::nullptr_t)
Create an empty TypeInfo object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:2017
static TypeInfo CreateMapTypeInfo(ONNXTensorElementDataType key_type, ConstTypeInfo value_type)
ConstTypeInfo GetConst() const
Definition onnxruntime_cxx_api.h:2028
TypeInfo(OrtTypeInfo *p)
C API Interop.
Definition onnxruntime_cxx_api.h:2018
Wrapper around OrtValue.
Definition onnxruntime_cxx_api.h:2368
static Value CreateSparseTensor(const OrtMemoryInfo *info, void *p_data, const Shape &dense_shape, const Shape &values_shape, ONNXTensorElementDataType type)
Creates an OrtValue instance containing SparseTensor. This constructs a sparse tensor that makes use ...
static Value CreateSparseTensor(const OrtMemoryInfo *info, T *p_data, const Shape &dense_shape, const Shape &values_shape)
This is a simple forwarding method to the other overload that helps deducing data type enum value fro...
Value & operator=(Value &&)=default
static Value CreateSparseTensor(OrtAllocator *allocator, const Shape &dense_shape, ONNXTensorElementDataType type)
Creates an instance of OrtValue containing sparse tensor. The created instance has no data....
Value(Value &&)=default
Value(std::nullptr_t)
Create an empty Value object, must be assigned a valid one to be used.
Definition onnxruntime_cxx_api.h:2374
static Value CreateTensor(const OrtMemoryInfo *info, T *p_data, size_t p_data_element_count, const int64_t *shape, size_t shape_len)
Creates a tensor with a user supplied buffer. Wraps OrtApi::CreateTensorWithDataAsOrtValue.
static Value CreateSparseTensor(OrtAllocator *allocator, const Shape &dense_shape)
This is a simple forwarding method to the below CreateSparseTensor. This helps to specify data type e...
static Value CreateTensor(OrtAllocator *allocator, const int64_t *shape, size_t shape_len, ONNXTensorElementDataType type)
Creates an OrtValue with a tensor using the supplied OrtAllocator. Wraps OrtApi::CreateTensorAsOrtVal...
UnownedValue GetUnowned() const
Definition onnxruntime_cxx_api.h:2379
static Value CreateSequence(const std::vector< Value > &values)
Creates an OrtValue with a Sequence Onnx type representation. The API would ref-count the supplied Or...
static Value CreateMap(const Value &keys, const Value &values)
Creates an OrtValue with a Map Onnx type representation. The API would ref-count the supplied OrtValu...
static Value CreateTensor(const OrtMemoryInfo *info, void *p_data, size_t p_data_byte_count, const int64_t *shape, size_t shape_len, ONNXTensorElementDataType type)
Creates a tensor with a user supplied buffer. Wraps OrtApi::CreateTensorWithDataAsOrtValue.
static Value CreateTensor(OrtAllocator *allocator, const int64_t *shape, size_t shape_len)
Creates an OrtValue with a tensor using a supplied OrtAllocator. Wraps OrtApi::CreateTensorAsOrtValue...
static Value CreateOpaque(const char *domain, const char *type_name, const T &value)
Creates an OrtValue wrapping an Opaque type. This is used for experimental support of non-tensor type...
static Value CreateTensor(OrtAllocator *deleter, void *p_data, size_t p_data_byte_count, const int64_t *shape, size_t shape_len, ONNXTensorElementDataType type)
Creates a tensor with a user supplied buffer. Wraps OrtApi::CreateTensorWithDataAndDeleterAsOrtValue.
ConstValue GetConst() const
Definition onnxruntime_cxx_api.h:2378
Definition onnxruntime_cxx_api.h:3292
int64_t index
Definition onnxruntime_cxx_api.h:3296
ConstNode node
Definition onnxruntime_cxx_api.h:3293
Wrapper around OrtValueInfo.
Definition onnxruntime_cxx_api.h:3197
ConstValueInfo GetConst() const
Definition onnxruntime_cxx_api.h:3207
ValueInfo(std::nullptr_t)
Definition onnxruntime_cxx_api.h:3199
ValueInfo(const std::string &name, const ConstTypeInfo &type_info)
ValueInfo(OrtValueInfo *p)
Take ownership of a pointer created by C API.
Definition onnxruntime_cxx_api.h:3201
ValueInfo()=default
Definition onnxruntime_cxx_api.h:773
AllocatedFree(OrtAllocator *allocator)
Definition onnxruntime_cxx_api.h:775
OrtAllocator * allocator_
Definition onnxruntime_cxx_api.h:774
void operator()(void *ptr) const
Definition onnxruntime_cxx_api.h:777
Base & operator=(Base &&v) noexcept
Definition onnxruntime_cxx_api.h:759
constexpr contained_type & operator*() const noexcept
Definition onnxruntime_cxx_api.h:766
typename Unowned< T >::Type contained_type
Definition onnxruntime_cxx_api.h:748
Base(Base &&v) noexcept
Definition onnxruntime_cxx_api.h:758
Base(const Base &)=default
constexpr Base(contained_type *p) noexcept
Definition onnxruntime_cxx_api.h:751
Base & operator=(const Base &)=default
Used internally by the C++ API. C++ wrapper types inherit from this. This is a zero cost abstraction ...
Definition onnxruntime_cxx_api.h:701
Base(Base &&v) noexcept
Definition onnxruntime_cxx_api.h:713
constexpr Base()=default
constexpr contained_type & operator*() const noexcept
Definition onnxruntime_cxx_api.h:721
contained_type * release()
Relinquishes ownership of the contained C object pointer. The underlying object is not destroyed.
Definition onnxruntime_cxx_api.h:725
Base(const Base &)=delete
constexpr Base(contained_type *p) noexcept
Definition onnxruntime_cxx_api.h:705
Base & operator=(const Base &)=delete
Base & operator=(Base &&v) noexcept
Definition onnxruntime_cxx_api.h:714
contained_type * p_
Definition onnxruntime_cxx_api.h:732
~Base()
Definition onnxruntime_cxx_api.h:706
T contained_type
Definition onnxruntime_cxx_api.h:702
Definition onnxruntime_cxx_api.h:907
const std::basic_string< char > GetFilePath() const
Definition onnxruntime_cxx_api.h:3307
std::vector< ConstNode > GetNodes() const
std::vector< ConstValueInfo > GetInputs() const
ConstNode GetParentNode() const
int64_t GetOnnxIRVersion() const
std::basic_string< char > GetModelPath() const
Graph GetGraphView(const std::vector< ConstNode > &nodes) const
ModelMetadata GetModelMetadata() const
Wraps OrtApi::Graph_GetModelMetadata.
std::vector< ConstValueInfo > GetInitializers() const
std::string GetName() const
std::vector< ConstValueInfo > GetOutputs() const
std::vector< OperatorSet > GetOperatorSets() const
Definition onnxruntime_cxx_api.h:2547
std::vector< Value > GetOutputValues(OrtAllocator *) const
std::vector< std::string > GetOutputNames(OrtAllocator *) const
std::vector< Value > GetOutputValues() const
std::vector< std::string > GetOutputNames() const
Definition onnxruntime_cxx_api.h:3407
std::pair< int, int > GetSinceVersion() const
Wraps OrtEpApi::KernelDef_GetSinceVersion.
const char * GetDomain() const
Wraps OrtEpApi::KernelDef_GetDomain.
OrtMemType GetOutputMemType(size_t output_index) const
Wraps OrtEpApi::KernelDef_GetOutputMemType.
const char * GetExecutionProvider() const
Wraps OrtEpApi::KernelDef_GetExecutionProvider.
OrtMemType GetInputMemType(size_t input_index) const
Wraps OrtEpApi::KernelDef_GetInputMemType.
const char * GetOperatorType() const
Wraps OrtEpApi::KernelDef_GetOperatorType.
Definition onnxruntime_cxx_api.h:3219
std::vector< ConstValueInfo > GetOutputs() const
std::vector< ConstValueInfo > GetImplicitInputs() const
std::string GetName() const
std::string GetDomain() const
std::vector< AttrNameSubgraph > GetSubgraphs() const
ConstGraphImpl< detail::Unowned< const OrtGraph > > GetGraph() const
std::string GetOperatorType() const
std::vector< ConstOpAttr > GetAttributes() const
std::vector< ConstValueInfo > GetInputs() const
Status GetAttributeByName(const std::string &name, ConstOpAttr &attr) const
std::string GetEpName() const
Definition onnxruntime_cxx_api.h:2616
std::string GetName() const
Status GetValue(R &out) const
Status GetTensorAttributeAsOrtValue(Value &) const
Status GetValueArray(std::vector< R > &out) const
OrtOpAttrType GetType() const
Definition onnxruntime_cxx_api.h:1690
std::vector< std::string > GetOutputNames() const
TypeInfo GetInputTypeInfo(size_t index) const
Wraps OrtApi::SessionGetInputTypeInfo.
std::vector< ConstEpAssignedSubgraph > GetEpGraphAssignmentInfo() const
Returns information on the subgraph/nodes assigned to execution providers in the session.
size_t GetOutputCount() const
Returns the number of model outputs.
std::vector< ValueInfo > GetOutputs() const
int GetOpset(const std::string &domain) const
Wraps OrtApi::SessionGetOpsetForDomain.
uint64_t GetProfilingStartTimeNs() const
Wraps OrtApi::SessionGetProfilingStartTimeNs.
std::vector< ConstEpDevice > GetEpDeviceForOutputs() const
Wrapper for OrtApi::SessionGetEpDeviceForOutputs.
std::vector< std::string > GetOverridableInitializerNames() const
ModelMetadata GetModelMetadata() const
Wraps OrtApi::SessionGetModelMetadata.
size_t GetInputCount() const
Returns the number of model inputs.
TypeInfo GetOutputTypeInfo(size_t index) const
Wraps OrtApi::SessionGetOutputTypeInfo.
std::vector< std::string > GetInputNames() const
AllocatedStringPtr GetOverridableInitializerNameAllocated(size_t index, OrtAllocator *allocator) const
Returns a copy of the overridable initializer name at the specified index.
std::vector< ConstEpDevice > GetEpDeviceForInputs() const
Wrapper for OrtApi::SessionGetEpDeviceForInputs.
AllocatedStringPtr GetOutputNameAllocated(size_t index, OrtAllocator *allocator) const
Returns a copy of output name at the specified index.
size_t GetOverridableInitializerCount() const
Returns the number of inputs that have defaults that can be overridden.
std::vector< ConstMemoryInfo > GetMemoryInfoForOutputs() const
Wrapper for OrtApi::SessionGetMemoryInfoForOutputs.
AllocatedStringPtr GetInputNameAllocated(size_t index, OrtAllocator *allocator) const
Returns a copy of input name at the specified index.
std::vector< ConstMemoryInfo > GetMemoryInfoForInputs() const
Wrapper for OrtApi::SessionGetMemoryInfoForInputs.
std::vector< ValueInfo > GetInputs() const
TypeInfo GetOverridableInitializerTypeInfo(size_t index) const
Wraps OrtApi::SessionGetOverridableInitializerTypeInfo.
Definition onnxruntime_cxx_api.h:2057
void GetStringTensorContent(void *buffer, size_t buffer_length, size_t *offsets, size_t offsets_count) const
The API copies all of the UTF-8 encoded string data contained within a tensor or a sparse tensor into...
void GetStringTensorElement(size_t buffer_length, size_t element_index, void *buffer) const
The API copies UTF-8 encoded bytes for the requested string element contained within a tensor or a sp...
TensorTypeAndShapeInfo GetSparseTensorIndicesTypeShapeInfo(OrtSparseIndicesFormat format) const
The API returns type and shape information for the specified indices. Each supported indices have the...
const void * GetTensorRawData() const
Returns a non-typed pointer to the data contained in a tensor.
std::string GetStringTensorElement(size_t element_index) const
Returns string tensor UTF-8 encoded string element. Use of this API is recommended over GetStringTens...
size_t GetStringTensorElementLength(size_t element_index) const
The API returns a byte length of UTF-8 encoded string element contained in either a tensor or a sparse...
size_t GetStringTensorDataLength() const
This API returns a full length of string data contained within either a tensor or a sparse Tensor....
bool IsSparseTensor() const
Returns true if the OrtValue contains a sparse tensor.
TypeInfo GetTypeInfo() const
The API returns type information for data contained in a tensor. For sparse tensors it returns type i...
const R * GetSparseTensorIndicesData(OrtSparseIndicesFormat indices_format, size_t &num_indices) const
The API retrieves a pointer to the internal indices buffer. The API merely performs a convenience dat...
bool IsTensor() const
Returns true if Value is a tensor, false for other types like map/sequence/etc.
ConstMemoryInfo GetTensorMemoryInfo() const
This API returns information about the memory allocation used to hold data.
size_t GetTensorSizeInBytes() const
Returns the total size of the tensor data in bytes. Throws an exception if the OrtValue does not cont...
const R * GetSparseTensorValues() const
The API returns a pointer to an internal buffer of the sparse tensor containing non-zero values....
TensorTypeAndShapeInfo GetTensorTypeAndShapeInfo() const
The API returns type information for data contained in a tensor. For sparse tensors it returns type i...
Value GetValue(int index, OrtAllocator *allocator) const
size_t GetCount() const
< Return true if OrtValue contains data and returns false if the OrtValue is a None
void GetOpaqueData(const char *domain, const char *type_name, R &) const
Obtains a pointer to user-defined data for experimental purposes.
TensorTypeAndShapeInfo GetSparseTensorValuesTypeAndShapeInfo() const
The API returns type and shape information for stored non-zero values of the sparse tensor....
const R * GetTensorData() const
Returns a const typed pointer to the tensor contained data. No type checking is performed,...
OrtSparseFormat GetSparseFormat() const
The API returns the sparse data format this OrtValue holds in a sparse tensor. If the sparse tensor w...
Definition onnxruntime_cxx_api.h:3162
Status GetInitializer(ConstValue &value) const
A wrapper around OrtApi::ValueInfo_GetInitializerValue
std::string GetName() const
A wrapper around OrtApi::GetValueInfoName
bool IsFromOuterScope() const
A wrapper around OrtApi::ValueInfo_IsFromOuterScope
Status GetExternalInitializerInfo(ExternalInitializerInfo &info) const
A wrapper around OrtApi::ValueInfo_GetExternalInitializerInfo
bool IsConstantInitializer() const
A wrapper around OrtApi::ValueInfo_IsConstantInitializer
std::vector< ValueInfoConsumerProducerInfo > GetConsumers() const
A wrapper around OrtApi::ValueInfo_GetValueConsumers
bool IsGraphOutput() const
A wrapper around OrtApi::ValueInfo_IsGraphOutput
bool IsRequiredGraphInput() const
A wrapper around OrtApi::ValueInfo_IsRequiredGraphInput
ConstTypeInfo TypeInfo() const
A wrapper around OrtApi::GetValueInfoTypeInfo
ValueInfoConsumerProducerInfo GetProducerNode() const
bool IsOptionalGraphInput() const
A wrapper around OrtApi::ValueInfo_IsOptionalGraphInput
Definition onnxruntime_cxx_api.h:1202
std::string GetDomain() const
std::string GetOperatorType() const
std::string GetName() const
Definition onnxruntime_cxx_api.h:1219
std::vector< ConstEpAssignedNode > GetNodes() const
Definition onnxruntime_cxx_api.h:1127
const char * EpName() const
const char * EpVendor() const
ConstKeyValuePairs EpOptions() const
ConstHardwareDevice Device() const
ConstMemoryInfo GetMemoryInfo(OrtDeviceMemoryType memory_type) const
Wraps EpDevice_MemoryInfo.
SyncStream CreateSyncStream(ConstKeyValuePairs stream_options={}) const
ConstKeyValuePairs EpMetadata() const
Definition onnxruntime_cxx_api.h:3336
void SetInputs(std::vector< ValueInfo > &inputs)
void SetOutputs(std::vector< ValueInfo > &outputs)
void AddNode(Node &node)
void AddInitializer(const std::string &name, Value &initializer, bool data_is_external)
Definition onnxruntime_cxx_api.h:1108
OrtHardwareDeviceType Type() const
const char * Vendor() const
ConstKeyValuePairs Metadata() const
Definition onnxruntime_cxx_api.h:2558
void BindOutput(const char *name, const Value &)
void BindInput(const char *name, const Value &)
void BindOutput(const char *name, const OrtMemoryInfo *)
Definition onnxruntime_cxx_api.h:947
void GetKeyValuePairs(std::vector< const char * > &keys, std::vector< const char * > &values) const
std::unordered_map< std::string, std::string > GetKeyValuePairs() const
const char * GetValue(const char *key) const
Definition onnxruntime_cxx_api.h:1964
ONNXTensorElementDataType GetMapKeyType() const
Wraps OrtApi::GetMapKeyType.
TypeInfo GetMapValueType() const
Wraps OrtApi::GetMapValueType.
Definition onnxruntime_cxx_api.h:986
std::string GetAllocatorName() const
Wrapper for MemoryInfoGetName.
int GetDeviceId() const
Wrapper for MemoryInfoGetId.
OrtMemType GetMemoryType() const
Wrapper for MemoryInfoGetMemType.
OrtDeviceMemoryType GetDeviceMemoryType() const
Wrapper for MemoryInfoGetDeviceMemType.
OrtMemoryInfoDeviceType GetDeviceType() const
Wrapper for MemoryInfoGetDeviceType.
OrtAllocatorType GetAllocatorType() const
Wrapper for MemoryInfoGetType.
uint32_t GetVendorId() const
Wrapper for MemoryInfoGetVendorId.
bool operator==(const MemoryInfoImpl< U > &o) const
Definition onnxruntime_cxx_api.h:3376
void AddGraph(Graph &graph)
Definition onnxruntime_cxx_api.h:1951
TypeInfo GetOptionalElementType() const
Wraps OrtApi::CastOptionalTypeToContainedTypeInfo.
Definition onnxruntime_cxx_api.h:2040
const char ** str
Definition onnxruntime_cxx_api.h:2045
const int64_t * values_shape
Definition onnxruntime_cxx_api.h:2041
size_t values_shape_len
Definition onnxruntime_cxx_api.h:2042
const void * p_data
Definition onnxruntime_cxx_api.h:2044
Definition onnxruntime_cxx_api.h:1927
TypeInfo GetSequenceElementType() const
Wraps OrtApi::GetSequenceElementType.
Definition onnxruntime_cxx_api.h:1754
void SetEpDynamicOptions(const char *const *keys, const char *const *values, size_t kv_len)
Set DynamicOptions for EPs (Execution Providers).
AllocatedStringPtr EndProfilingAllocated(OrtAllocator *allocator)
End profiling and return a copy of the profiling file name.
void FinalizeModelEditorSession(const Model &model, const SessionOptions &options, OrtPrepackedWeightsContainer *prepacked_weights_container=nullptr)
void Run(const RunOptions &run_options, const IoBinding &)
Wraps OrtApi::RunWithBinding.
void RunAsync(const RunOptions &run_options, const char *const *input_names, const Value *input_values, size_t input_count, const char *const *output_names, Value *output_values, size_t output_count, RunAsyncCallbackFn callback, void *user_data)
Run the model asynchronously in a thread owned by intra op thread pool.
std::vector< Value > Run(const RunOptions &run_options, const char *const *input_names, const Value *input_values, size_t input_count, const char *const *output_names, size_t output_count)
Run the model returning results in an Ort allocated vector.
void Run(const RunOptions &run_options, const char *const *input_names, const Value *input_values, size_t input_count, const char *const *output_names, Value *output_values, size_t output_count)
Run the model returning results in user provided outputs. Same as Run(const RunOptions&,...
Definition onnxruntime_cxx_api.h:2051
const int64_t * shape
Definition onnxruntime_cxx_api.h:2052
size_t shape_len
Definition onnxruntime_cxx_api.h:2053
Definition onnxruntime_cxx_api.h:3491
Status StoreWeightData(void **buffer_data_ptrs, size_t *buffer_sizes, size_t num_buffers)
Definition onnxruntime_cxx_api.h:1089
void * GetHandle()
Wraps SyncStream_GetHandle.
Definition onnxruntime_cxx_api.h:1877
size_t GetElementCount() const
Wraps OrtApi::GetTensorShapeElementCount.
void GetDimensions(int64_t *values, size_t values_count) const
Wraps OrtApi::GetDimensions.
std::vector< int64_t > GetShape() const
Uses GetDimensionsCount & GetDimensions to return a std::vector of the shape.
std::vector< const char * > GetSymbolicDimensions() const
void GetSymbolicDimensions(const char **values, size_t values_count) const
Wraps OrtApi::GetSymbolicDimensions.
size_t GetDimensionsCount() const
Wraps OrtApi::GetDimensionsCount.
ONNXTensorElementDataType GetElementType() const
Wraps OrtApi::GetTensorElementType.
bool HasShape() const
Wraps OrtApi::TensorTypeAndShape_HasShape.
Definition onnxruntime_cxx_api.h:1989
ONNXType GetONNXType() const
ConstSequenceTypeInfo GetSequenceTypeInfo() const
Wraps OrtApi::CastTypeInfoToSequenceTypeInfo.
ConstMapTypeInfo GetMapTypeInfo() const
Wraps OrtApi::CastTypeInfoToMapTypeInfo.
ConstOptionalTypeInfo GetOptionalTypeInfo() const
Wraps OrtApi::CastTypeInfoToOptionalTypeInfo.
ConstTensorTypeAndShapeInfo GetTensorTypeAndShapeInfo() const
Wraps OrtApi::CastTypeInfoToTensorInfo.
This is a tagging template type. Use it with Base<T> to indicate that the C++ interface object has no...
Definition onnxruntime_cxx_api.h:677
T Type
Definition onnxruntime_cxx_api.h:678
Definition onnxruntime_cxx_api.h:2226
void FillStringTensorElement(const char *s, size_t index)
Set a single string in a string tensor.
R * GetTensorMutableData()
Returns a non-const typed pointer to an OrtValue/Tensor contained buffer. No type checking is performe...
R & At(const std::vector< int64_t > &location)
void UseBlockSparseIndices(const Shape &indices_shape, int32_t *indices_data)
Supplies BlockSparse format specific indices and marks the contained sparse tensor as being a BlockSp...
void FillSparseTensorBlockSparse(const OrtMemoryInfo *data_mem_info, const OrtSparseValuesParam &values, const Shape &indices_shape, const int32_t *indices_data)
The API will allocate memory using the allocator instance supplied to the CreateSparseTensor() API an...
void * GetTensorMutableRawData()
Returns a non-typed non-const pointer to the data contained in a tensor.
void UseCooIndices(int64_t *indices_data, size_t indices_num)
Supplies COO format specific indices and marks the contained sparse tensor as being a COO format tens...
void FillSparseTensorCoo(const OrtMemoryInfo *data_mem_info, const OrtSparseValuesParam &values_param, const int64_t *indices_data, size_t indices_num)
The API will allocate memory using the allocator instance supplied to the CreateSparseTensor() API an...
void FillStringTensor(const char *const *s, size_t s_len)
Set all strings at once in a string tensor.
void UseCsrIndices(int64_t *inner_data, size_t inner_num, int64_t *outer_data, size_t outer_num)
Supplies CSR format specific indices and marks the contained sparse tensor as being a CSR format tens...
void FillSparseTensorCsr(const OrtMemoryInfo *data_mem_info, const OrtSparseValuesParam &values, const int64_t *inner_indices_data, size_t inner_indices_num, const int64_t *outer_indices_data, size_t outer_indices_num)
The API will allocate memory using the allocator instance supplied to the CreateSparseTensor() API an...
char * GetResizedStringTensorElementBuffer(size_t index, size_t buffer_length)
Allocate if necessary and obtain a pointer to a UTF-8 encoded string element buffer indexed by the fl...
Memory allocation interface.
Definition onnxruntime_c_api.h:355
void(* Free)(struct OrtAllocator *this_, void *p)
Free a block of memory previously allocated with OrtAllocator::Alloc.
Definition onnxruntime_c_api.h:362
const OrtApi *(* GetApi)(uint32_t version)
Get a pointer to the requested version of the OrtApi.
Definition onnxruntime_c_api.h:920
The C API.
Definition onnxruntime_c_api.h:1145
const OrtEpApi *(* GetEpApi)(void)
Get the OrtEpApi instance for implementing an execution provider.
Definition onnxruntime_c_api.h:5618
const OrtInteropApi *(* GetInteropApi)(void)
Get the EP Interop API instance.
Definition onnxruntime_c_api.h:6862
const OrtCompileApi *(* GetCompileApi)(void)
Get the Compile API instance.
Definition onnxruntime_c_api.h:5350
void(* ReleaseTensorRTProviderOptions)(OrtTensorRTProviderOptionsV2 *input)
Release an OrtTensorRTProviderOptionsV2.
Definition onnxruntime_c_api.h:3401
const OrtModelEditorApi *(* GetModelEditorApi)(void)
Get the Model Editor API instance.
Definition onnxruntime_c_api.h:5292
void(* ReleaseCUDAProviderOptions)(OrtCUDAProviderOptionsV2 *input)
Release an OrtCUDAProviderOptionsV2.
Definition onnxruntime_c_api.h:3904
CUDA Provider Options.
Definition onnxruntime_c_api.h:620
The OrtCompileApi struct provides functions to compile ONNX models.
Definition onnxruntime_c_api.h:7752
Definition onnxruntime_c_api.h:7225
int(* GetVariadicInputHomogeneity)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:7271
OrtCustomOpInputOutputCharacteristic(* GetOutputCharacteristic)(const struct OrtCustomOp *op, size_t index)
Definition onnxruntime_c_api.h:7255
size_t(* GetInputTypeCount)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:7243
int(* GetVariadicOutputMinArity)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:7275
size_t(* GetAliasMap)(int **input_index, int **output_index)
Definition onnxruntime_c_api.h:7308
int(* GetStartVersion)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:7293
void(* ReleaseMayInplace)(int *input_index, int *output_index)
Definition onnxruntime_c_api.h:7305
const char *(* GetName)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:7236
size_t(* GetOutputTypeCount)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:7245
void(* KernelDestroy)(void *op_kernel)
Definition onnxruntime_c_api.h:7251
int(* GetVariadicOutputHomogeneity)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:7280
OrtMemType(* GetInputMemoryType)(const struct OrtCustomOp *op, size_t index)
Definition onnxruntime_c_api.h:7262
void *(* CreateKernel)(const struct OrtCustomOp *op, const OrtApi *api, const OrtKernelInfo *info)
Definition onnxruntime_c_api.h:7232
uint32_t version
Definition onnxruntime_c_api.h:7226
ONNXTensorElementDataType(* GetInputType)(const struct OrtCustomOp *op, size_t index)
Definition onnxruntime_c_api.h:7242
void(* ReleaseAliasMap)(int *input_index, int *output_index)
Definition onnxruntime_c_api.h:7309
OrtCustomOpInputOutputCharacteristic(* GetInputCharacteristic)(const struct OrtCustomOp *op, size_t index)
Definition onnxruntime_c_api.h:7254
const char *(* GetExecutionProviderType)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:7239
ONNXTensorElementDataType(* GetOutputType)(const struct OrtCustomOp *op, size_t index)
Definition onnxruntime_c_api.h:7244
int(* GetVariadicInputMinArity)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:7266
OrtStatusPtr(* InferOutputShapeFn)(const struct OrtCustomOp *op, OrtShapeInferContext *)
Definition onnxruntime_c_api.h:7290
int(* GetEndVersion)(const struct OrtCustomOp *op)
Definition onnxruntime_c_api.h:7294
OrtStatusPtr(* CreateKernelV2)(const struct OrtCustomOp *op, const OrtApi *api, const OrtKernelInfo *info, void **kernel)
Definition onnxruntime_c_api.h:7283
size_t(* GetMayInplace)(int **input_index, int **output_index)
Definition onnxruntime_c_api.h:7301
OrtStatusPtr(* KernelComputeV2)(void *op_kernel, OrtKernelContext *context)
Definition onnxruntime_c_api.h:7288
void(* KernelCompute)(void *op_kernel, OrtKernelContext *context)
Definition onnxruntime_c_api.h:7250
Configuration options for creating an OrtEnv.
Definition onnxruntime_c_api.h:1057
The OrtEpApi struct provides functions that are relevant to the implementation of an execution provid...
Definition onnxruntime_ep_c_api.h:751
The OrtEpFactory provides functions to create and manage execution providers.
Definition onnxruntime_ep_c_api.h:1786
The OrtEp struct provides functions to implement for an execution provider.
Definition onnxruntime_ep_c_api.h:1468
The OrtInteropApi struct provides functions for external resource interop with execution providers.
Definition onnxruntime_c_api.h:8025
MIGraphX Provider Options.
Definition onnxruntime_c_api.h:824
The OrtModelEditorApi struct provides functions to create or edit an ONNX model.
Definition onnxruntime_c_api.h:7323
OpenVINO Provider Options.
Definition onnxruntime_c_api.h:863
ROCM Provider Options.
Definition onnxruntime_c_api.h:707
TensorRT Provider Options.
Definition onnxruntime_c_api.h:796