Compare commits

...

2 Commits

  1. .gitignore (2)
  2. .vscode/settings.json (58)
  3. addon_config.mk (5)
  4. libs/onnxruntime/include/onnxruntime_c_api.h (47)
  5. libs/onnxruntime/include/onnxruntime_cxx_api.h (41)
  6. libs/onnxruntime/include/onnxruntime_cxx_inline.h (4)
  7. libs/onnxruntime/include/onnxruntime_session_options_config_keys.h (55)
  8. libs/onnxruntime/lib/msys2/onnxruntime.dll (BIN)
  9. libs/onnxruntime/lib/msys2/onnxruntime.lib (BIN)
  10. libs/onnxruntime/lib/msys2/onnxruntime_providers_cuda.dll (BIN)
  11. libs/onnxruntime/lib/msys2/onnxruntime_providers_cuda.lib (BIN)
  12. libs/onnxruntime/lib/msys2/onnxruntime_providers_shared.dll (BIN)
  13. libs/onnxruntime/lib/msys2/onnxruntime_providers_shared.lib (BIN)
  14. libs/onnxruntime/lib/msys2/onnxruntime_providers_tensorrt.dll (BIN)
  15. libs/onnxruntime/lib/msys2/onnxruntime_providers_tensorrt.lib (BIN)
  16. src/ofxOnnxRuntime.cpp (179)
  17. src/ofxOnnxRuntime.h (74)
  18. temp.cpp (297)

2
.gitignore

@@ -1,5 +1,5 @@
# Ignoring onnxruntime libs
# /libs/onnxruntime/lib/*
/libs/onnxruntime/lib/msys2/*
example-*/config.make
example-*/*.sln

58
.vscode/settings.json

@@ -0,0 +1,58 @@
{
"files.associations": {
"xiosbase": "cpp",
"algorithm": "cpp",
"array": "cpp",
"atomic": "cpp",
"bit": "cpp",
"cctype": "cpp",
"clocale": "cpp",
"cmath": "cpp",
"compare": "cpp",
"concepts": "cpp",
"cstddef": "cpp",
"cstdint": "cpp",
"cstdio": "cpp",
"cstdlib": "cpp",
"cstring": "cpp",
"ctime": "cpp",
"cwchar": "cpp",
"exception": "cpp",
"functional": "cpp",
"initializer_list": "cpp",
"ios": "cpp",
"iosfwd": "cpp",
"iostream": "cpp",
"istream": "cpp",
"iterator": "cpp",
"limits": "cpp",
"list": "cpp",
"memory": "cpp",
"new": "cpp",
"numeric": "cpp",
"optional": "cpp",
"ostream": "cpp",
"stdexcept": "cpp",
"streambuf": "cpp",
"string": "cpp",
"system_error": "cpp",
"tuple": "cpp",
"type_traits": "cpp",
"typeinfo": "cpp",
"unordered_map": "cpp",
"unordered_set": "cpp",
"utility": "cpp",
"variant": "cpp",
"vector": "cpp",
"xfacet": "cpp",
"xhash": "cpp",
"xlocale": "cpp",
"xlocinfo": "cpp",
"xlocnum": "cpp",
"xmemory": "cpp",
"xstddef": "cpp",
"xstring": "cpp",
"xtr1common": "cpp",
"xutility": "cpp"
}
}

5
addon_config.mk

@@ -1,11 +1,12 @@
meta:
ADDON_NAME = ofxOnnxRuntime
ADDON_DESCRIPTION = "ONNX Runtime addon for OpenFrameworks"
ADDON_AUTHOR = Yuya Hanai
ADDON_AUTHOR = Cailean Finn
ADDON_TAGS = "ONNX"
ADDON_URL = https://github.com/hanasaan/ofxOnnxRuntime
ADDON_URL = https://github.com/caileannn/ofxOnnxRuntime
common:
ADDON_DEPENDENCIES = ofxOpenCv
ADDON_INCLUDES = libs/onnxruntime/include
ADDON_INCLUDES += src
osx:

47
libs/onnxruntime/include/onnxruntime_c_api.h

@@ -38,7 +38,7 @@
*
* This value is used by some API functions to behave as this version of the header expects.
*/
#define ORT_API_VERSION 21
#define ORT_API_VERSION 20
#ifdef __cplusplus
extern "C" {
@@ -46,7 +46,7 @@ extern "C" {
//! @}
// SAL2 Definitions
#ifndef _MSC_VER
#ifndef _WIN32
#define _In_
#define _In_z_
#define _In_opt_
@@ -626,13 +626,8 @@ typedef struct OrtMIGraphXProviderOptions {
} OrtMIGraphXProviderOptions;
/** \brief OpenVINO Provider Options
* \brief This Struct is frozen since ORT 1.13.0. Its maintained part of Legacy API for compatibility.
* \brief For latest OpenVINO Provider Options update to the ProviderOptions map.
* \brief Latest OpenVINO Provider Options are listed in the
* \htmlonly
* <a href="https://onnxruntime.ai/docs/execution-providers/OpenVINO-ExecutionProvider.html#summary-of-options">onnxruntime document.</a>
* \endhtmlonly
* \see OrtApi::SessionOptionsAppendExecutionProvider()
*
* \see OrtApi::SessionOptionsAppendExecutionProvider_OpenVINO
*/
typedef struct OrtOpenVINOProviderOptions {
#ifdef __cplusplus
@@ -650,7 +645,7 @@ typedef struct OrtOpenVINOProviderOptions {
* Valid settings are one of: "CPU_FP32", "CPU_FP16", "GPU_FP32", "GPU_FP16"
*/
const char* device_type;
unsigned char enable_npu_fast_compile; ///< 0 = disabled, nonzero = enabled
unsigned char enable_npu_fast_compile;
const char* device_id;
size_t num_of_threads; ///< 0 = Use default number of threads
const char* cache_dir; // path is set to empty by default
@@ -3665,19 +3660,8 @@ struct OrtApi {
* - "1": Enabled.
* "offload_graph_io_quantization": Offload graph input quantization and graph output dequantization to another
* execution provider (typically CPU EP).
* - "0": Disabled. QNN EP will handle quantization and dequantization of graph I/O.
* - "1": Enabled. This is the default value.
* "enable_htp_spill_fill_buffer": Enable HTP spill fill buffer setting. The flag is used while generating context binary.
* - "0": Default. Disabled.
* - "1": Enabled.
* "enable_htp_shared_memory_allocator": Enable the QNN HTP shared memory allocator. Requires libcdsprpc.so/dll to
* be available.
* - "0": Default. Disabled.
* - "0": Default. Disabled. QNN EP will handle quantization and dequantization of graph I/O.
* - "1": Enabled.
* "dump_json_qnn_graph": Set to "1" to dump QNN graphs generated by QNN EP as JSON files. Each graph partition
* assigned to QNN EP is dumped to a separate file.
* "json_qnn_graph_dir": Directory in which to dump QNN JSON graphs. If not specified, QNN graphs are dumped in the
* program's current working directory. Ignored if "dump_json_qnn_graph" is not set.
*
* SNPE supported keys:
* "runtime": SNPE runtime engine, options: "CPU", "CPU_FLOAT32", "GPU", "GPU_FLOAT32_16_HYBRID", "GPU_FLOAT16",
@@ -4623,8 +4607,6 @@ struct OrtApi {
* \param[in] num_keys
*
* \snippet{doc} snippets.dox OrtStatus Return Value
*
* \since Version 1.17.
*/
ORT_API2_STATUS(SessionOptionsAppendExecutionProvider_OpenVINO_V2,
_In_ OrtSessionOptions* options,
@@ -4642,8 +4624,6 @@ struct OrtApi {
* \param[in] num_keys
*
* \snippet{doc} snippets.dox OrtStatus Return Value
*
* \since Version 1.18.
*/
ORT_API2_STATUS(SessionOptionsAppendExecutionProvider_VitisAI,
_In_ OrtSessionOptions* options,
@@ -4657,10 +4637,7 @@ struct OrtApi {
* \param[in] mem_info OrtMemoryInfo instance
* \param[in] count_or_bytes How many bytes is this scratch buffer
* \param[out] out A pointer to the scrach buffer
*
* \snippet{doc} snippets.dox OrtStatus Return Value
*
* \since Version 1.18.
*/
ORT_API2_STATUS(KernelContext_GetScratchBuffer, _In_ const OrtKernelContext* context, _In_ const OrtMemoryInfo* mem_info, _In_ size_t count_or_bytes, _Outptr_ void** out);
@@ -4671,8 +4648,6 @@ struct OrtApi {
* \param[out] out A pointer to OrtAllocator
*
* \snippet{doc} snippets.dox OrtStatus Return Value
*
* \since Version 1.18.
*/
ORT_API2_STATUS(KernelInfoGetAllocator, _In_ const OrtKernelInfo* info, _In_ OrtMemType mem_type, _Outptr_ OrtAllocator** out);
@@ -4694,8 +4669,6 @@ struct OrtApi {
* \param[in] num_external_initializer_files Number of external files
*
* \snippet{doc} snippets.dox OrtStatus Return Value
*
* \since Version 1.18.
*/
ORT_API2_STATUS(AddExternalInitializersFromFilesInMemory, _In_ OrtSessionOptions* options,
_In_reads_(num_external_initializer_files) const ORTCHAR_T* const* external_initializer_file_names,
@@ -4718,8 +4691,6 @@ struct OrtApi {
* OrtApi::ReleaseLoraAdapter.
*
* \snippet{doc} snippets.dox OrtStatus Return Value
*
* \since Version 1.20.
*/
ORT_API2_STATUS(CreateLoraAdapter, const ORTCHAR_T* adapter_file_path, _In_ OrtAllocator* allocator,
_Outptr_ OrtLoraAdapter** out);
@@ -4738,8 +4709,6 @@ struct OrtApi {
* OrtApi::ReleaseLoraAdapter.
*
* \snippet{doc} snippets.dox OrtStatus Return Value
*
* \since Version 1.20.
*/
ORT_API2_STATUS(CreateLoraAdapterFromArray, _In_ const void* bytes, size_t num_bytes, _In_ OrtAllocator* allocator,
_Outptr_ OrtLoraAdapter** out);
@@ -4761,8 +4730,6 @@ struct OrtApi {
* \param[in] adapter OrtLoraAdapter instance
*
* \snippet{doc} snippets.dox OrtStatus Return Value
*
* \since Version 1.20.
*/
ORT_API2_STATUS(RunOptionsAddActiveLoraAdapter, _Inout_ OrtRunOptions* options, _In_ const OrtLoraAdapter* adapter);
@@ -4781,8 +4748,6 @@ struct OrtApi {
* \param[in] kv_len Number of elements in the keys and values arrays
*
* \snippet{doc} snippets.dox OrtStatus Return Value
*
* \since Version 1.20.
*/
ORT_API2_STATUS(SetEpDynamicOptions, _Inout_ OrtSession* sess, _In_reads_(kv_len) const char* const* keys,
_In_reads_(kv_len) const char* const* values, _In_ size_t kv_len);
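The header changes above pin ORT_API_VERSION back from 21 to 20, presumably to match the 1.20-series binaries now bundled under libs/onnxruntime/lib/msys2. The sketch below shows the standard way the loaded runtime is checked against the header's API version at startup; the check itself is plain ONNX Runtime C API usage, and the printed strings are only illustrative:

#include <onnxruntime_c_api.h>
#include <stdio.h>

int main(void) {
    // GetApi() returns NULL if the loaded onnxruntime binary is older than
    // the ORT_API_VERSION this header was compiled against.
    const OrtApi* api = OrtGetApiBase()->GetApi(ORT_API_VERSION);
    if (api == NULL) {
        printf("onnxruntime binary does not support API version %d\n", ORT_API_VERSION);
        return 1;
    }
    printf("onnxruntime %s, API version %d\n",
           OrtGetApiBase()->GetVersionString(), ORT_API_VERSION);
    return 0;
}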

41
libs/onnxruntime/include/onnxruntime_cxx_api.h

@@ -650,9 +650,6 @@ using AllocatedStringPtr = std::unique_ptr<char, detail::AllocatedFree>;
* constructors to construct an instance of a Status object from exceptions.
*/
struct Status : detail::Base<OrtStatus> {
using Base = detail::Base<OrtStatus>;
using Base::Base;
explicit Status(std::nullptr_t) noexcept {} ///< Create an empty object, must be assigned a valid one to be used
explicit Status(OrtStatus* status) noexcept; ///< Takes ownership of OrtStatus instance returned from the C API.
explicit Status(const Exception&) noexcept; ///< Creates status instance out of exception
@@ -731,9 +728,6 @@ struct Env : detail::Base<OrtEnv> {
*
*/
struct CustomOpDomain : detail::Base<OrtCustomOpDomain> {
using Base = detail::Base<OrtCustomOpDomain>;
using Base::Base;
explicit CustomOpDomain(std::nullptr_t) {} ///< Create an empty CustomOpDomain object, must be assigned a valid one to be used
/// \brief Wraps OrtApi::CreateCustomOpDomain
@@ -969,10 +963,8 @@ struct SessionOptions : detail::SessionOptionsImpl<OrtSessionOptions> {
*
*/
struct ModelMetadata : detail::Base<OrtModelMetadata> {
using Base = detail::Base<OrtModelMetadata>;
using Base::Base;
explicit ModelMetadata(std::nullptr_t) {} ///< Create an empty ModelMetadata object, must be assigned a valid one to be used
explicit ModelMetadata(std::nullptr_t) {} ///< Create an empty ModelMetadata object, must be assigned a valid one to be used
explicit ModelMetadata(OrtModelMetadata* p) : Base<OrtModelMetadata>{p} {} ///< Used for interop with the C API
/** \brief Returns a copy of the producer name.
*
@@ -1245,9 +1237,6 @@ using ConstTensorTypeAndShapeInfo = detail::TensorTypeAndShapeInfoImpl<detail::U
*
*/
struct TensorTypeAndShapeInfo : detail::TensorTypeAndShapeInfoImpl<OrtTensorTypeAndShapeInfo> {
using Base = detail::TensorTypeAndShapeInfoImpl<OrtTensorTypeAndShapeInfo>;
using Base::Base;
explicit TensorTypeAndShapeInfo(std::nullptr_t) {} ///< Create an empty TensorTypeAndShapeInfo object, must be assigned a valid one to be used
explicit TensorTypeAndShapeInfo(OrtTensorTypeAndShapeInfo* p) : TensorTypeAndShapeInfoImpl{p} {} ///< Used for interop with the C API
ConstTensorTypeAndShapeInfo GetConst() const { return ConstTensorTypeAndShapeInfo{this->p_}; }
@@ -1269,9 +1258,6 @@ using ConstSequenceTypeInfo = detail::SequenceTypeInfoImpl<detail::Unowned<const
*
*/
struct SequenceTypeInfo : detail::SequenceTypeInfoImpl<OrtSequenceTypeInfo> {
using Base = detail::SequenceTypeInfoImpl<OrtSequenceTypeInfo>;
using Base::Base;
explicit SequenceTypeInfo(std::nullptr_t) {} ///< Create an empty SequenceTypeInfo object, must be assigned a valid one to be used
explicit SequenceTypeInfo(OrtSequenceTypeInfo* p) : SequenceTypeInfoImpl<OrtSequenceTypeInfo>{p} {} ///< Used for interop with the C API
ConstSequenceTypeInfo GetConst() const { return ConstSequenceTypeInfo{this->p_}; }
@@ -1307,9 +1293,6 @@ using ConstMapTypeInfo = detail::MapTypeInfoImpl<detail::Unowned<const OrtMapTyp
*
*/
struct MapTypeInfo : detail::MapTypeInfoImpl<OrtMapTypeInfo> {
using Base = detail::MapTypeInfoImpl<OrtMapTypeInfo>;
using Base::Base;
explicit MapTypeInfo(std::nullptr_t) {} ///< Create an empty MapTypeInfo object, must be assigned a valid one to be used
explicit MapTypeInfo(OrtMapTypeInfo* p) : MapTypeInfoImpl<OrtMapTypeInfo>{p} {} ///< Used for interop with the C API
ConstMapTypeInfo GetConst() const { return ConstMapTypeInfo{this->p_}; }
@@ -1341,9 +1324,6 @@ using ConstTypeInfo = detail::TypeInfoImpl<detail::Unowned<const OrtTypeInfo>>;
/// the information about contained sequence or map depending on the ONNXType.
/// </summary>
struct TypeInfo : detail::TypeInfoImpl<OrtTypeInfo> {
using Base = detail::TypeInfoImpl<OrtTypeInfo>;
using Base::Base;
explicit TypeInfo(std::nullptr_t) {} ///< Create an empty TypeInfo object, must be assigned a valid one to be used
explicit TypeInfo(OrtTypeInfo* p) : TypeInfoImpl<OrtTypeInfo>{p} {} ///< C API Interop
@@ -1681,11 +1661,11 @@ using UnownedValue = detail::ValueImpl<detail::Unowned<OrtValue>>;
*/
struct Value : detail::ValueImpl<OrtValue> {
using Base = detail::ValueImpl<OrtValue>;
using Base::Base;
using OrtSparseValuesParam = detail::OrtSparseValuesParam;
using Shape = detail::Shape;
explicit Value(std::nullptr_t) {} ///< Create an empty Value object, must be assigned a valid one to be used
explicit Value(std::nullptr_t) {} ///< Create an empty Value object, must be assigned a valid one to be used
explicit Value(OrtValue* p) : Base{p} {} ///< Used for interop with the C API
Value(Value&&) = default;
Value& operator=(Value&&) = default;
@@ -1961,10 +1941,6 @@ struct ArenaCfg : detail::Base<OrtArenaCfg> {
/// This struct provides life time management for custom op attribute
/// </summary>
struct OpAttr : detail::Base<OrtOpAttr> {
using Base = detail::Base<OrtOpAttr>;
using Base::Base;
explicit OpAttr(std::nullptr_t) {}
OpAttr(const char* name, const void* data, int len, OrtOpAttrType type);
};
@@ -2130,10 +2106,10 @@ struct KernelContext {
explicit KernelContext(OrtKernelContext* context);
size_t GetInputCount() const;
size_t GetOutputCount() const;
// If input is optional and is not present, the method returns an empty ConstValue
// If input is optional and is not present, the method returns en empty ConstValue
// which can be compared to nullptr.
ConstValue GetInput(size_t index) const;
// If output is optional and is not present, the method returns an empty UnownedValue
// If outout is optional and is not present, the method returns en empty UnownedValue
// which can be compared to nullptr.
UnownedValue GetOutput(size_t index, const int64_t* dim_values, size_t dim_count) const;
UnownedValue GetOutput(size_t index, const std::vector<int64_t>& dims) const;
@@ -2207,8 +2183,6 @@ using ConstKernelInfo = detail::KernelInfoImpl<detail::Unowned<const OrtKernelIn
/// so it does not destroy the pointer the kernel does not own.
/// </summary>
struct KernelInfo : detail::KernelInfoImpl<OrtKernelInfo> {
using Base = detail::KernelInfoImpl<OrtKernelInfo>;
using Base::Base;
explicit KernelInfo(std::nullptr_t) {} ///< Create an empty instance to initialize later
explicit KernelInfo(OrtKernelInfo* info); ///< Take ownership of the instance
ConstKernelInfo GetConst() const { return ConstKernelInfo{this->p_}; }
@@ -2218,9 +2192,6 @@ struct KernelInfo : detail::KernelInfoImpl<OrtKernelInfo> {
/// Create and own custom defined operation.
/// </summary>
struct Op : detail::Base<OrtOp> {
using Base = detail::Base<OrtOp>;
using Base::Base;
explicit Op(std::nullptr_t) {} ///< Create an empty Operator object, must be assigned a valid one to be used
explicit Op(OrtOp*); ///< Take ownership of the OrtOp
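The removed "using Base::Base;" lines above appear to be part of stepping the C++ header back to the older wrapper style; the nullptr constructors that remain still support the construct-empty-then-assign idiom the comments describe. A small sketch of that idiom using standard Ort C++ API calls; the tensor data and shape are illustrative:

#include <onnxruntime_cxx_api.h>
#include <cstdint>
#include <vector>

int main() {
    Ort::Value value{nullptr};  // empty wrapper, must be assigned before it is used

    std::vector<float> data{1.f, 2.f, 3.f, 4.f};
    std::vector<int64_t> shape{1, 4};
    auto mem = Ort::MemoryInfo::CreateCpu(OrtArenaAllocator, OrtMemTypeDefault);

    // Assign a real tensor; only now is the wrapper usable.
    value = Ort::Value::CreateTensor<float>(mem, data.data(), data.size(),
                                            shape.data(), shape.size());
    return value.IsTensor() ? 0 : 1;
}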

4
libs/onnxruntime/include/onnxruntime_cxx_inline.h

@@ -51,7 +51,7 @@ inline void ThrowOnError(const Status& st) {
}
}
inline Status::Status(OrtStatus* status) noexcept : detail::Base<OrtStatus>{status} {
inline Status::Status(OrtStatus* status) noexcept : Base<OrtStatus>{status} {
}
inline Status::Status(const std::exception& e) noexcept {
@@ -1908,7 +1908,7 @@ inline void attr_utils::GetAttrs(const OrtKernelInfo* p, const char* name, std::
inline KernelInfo::KernelInfo(OrtKernelInfo* info) : detail::KernelInfoImpl<OrtKernelInfo>{info} {}
inline Op::Op(OrtOp* p) : detail::Base<OrtOp>(p) {}
inline Op::Op(OrtOp* p) : Base<OrtOp>(p) {}
inline Op Op::Create(const OrtKernelInfo* info, const char* op_name, const char* domain, int version,
const char** type_constraint_names,

55
libs/onnxruntime/include/onnxruntime_session_options_config_keys.h

@@ -250,51 +250,6 @@ static const char* const kOrtSessionOptionsOptimizedModelExternalInitializersFil
static const char* const kOrtSessionOptionsOptimizedModelExternalInitializersMinSizeInBytes =
"session.optimized_model_external_initializers_min_size_in_bytes";
// When loading model from memory buffer and the model has external initializers
// Use this config to set the external data file folder path
// All external data files should be in the same folder
static const char* const kOrtSessionOptionsModelExternalInitializersFileFolderPath =
"session.model_external_initializers_file_folder_path";
// Use this config when saving pre-packed constant initializers to an external data file.
// This allows you to memory map pre-packed initializers on model load and leave it to
// to the OS the amount of memory consumed by the pre-packed initializers. Otherwise,
// pre-packed data resides on the heap.
//
// - "0": Default is not save pre-packed initializers to a data file.
// - "1": Save pre-packed constant initializers to an external data file.
// Sample usage: sess_options.add_session_config_entry(kOrtSessionOptionsSavePrePackedConstantInitializers, "1")
static const char* const kOrtSessionOptionsSavePrePackedConstantInitializers =
"session.save_external_prepacked_constant_initializers";
// Use this config when you want to collect memory stats for each node in the graph.
// The file format is a CSV file with the following columns:
// The file will be created if it does not exist, and will be overwritten if it does.
//
// The content of the file can be used to estimate memory requirements at run time including
// the temporary allocations. This operation is preferably done on a CPU device, as the model may exceed
// device memory limits in constrained environments. When enabling this option, it is important to disable
// memory patterns, as they tend to allocate large blocks to avoid fragmentation and accommodate needs of multiple
// kernels. Memory patterns may make it difficult to allocate on a device with limited memory.
//
// The collected stats then can be used to partition the graph among the devices in a way that only the
// required memory is allocated on each device.
//
// node_name, initializers_memory, dynamic_outputs_sizes, temp_allocations_size
//
// - "full path to file": there is not a default for this option. If the file can not be opened for writing, an error will be returned.
static const char* const kOrtSessionOptionsCollectNodeMemoryStatsToFile = "session.collect_node_memory_stats_to_file";
/// This is a composite CSV setting formatted as "memory limit in kb,file name for collected stats"
/// "limit > 0": enables Capacity Aware Partitioning for Cuda EP. `limit` is optional and when absent
/// the provider may attempt to figure out the memory available automatically.
/// The setting with no limit is expected to look like: ",file name for collected stats"
/// The EP will place nodes on device "file name" :
/// this file is expected to be found at the same folder with the model. The file contains
/// pre-recorded stats collected when running with kOrtSessionOptionsCollectNodeMemoryStatsToFile enforce (see above)
static const char* const kOrtSessionOptionsResourceCudaPartitioningSettings =
"session.resource_cuda_partitioning_settings";
// Enable EP context feature to dump the partitioned graph which includes the EP context into Onnx file.
// The dumped Onnx model with EP context can be used for future inference to avoid the EP graph partitioning/compile overhead.
// "0": disable. (default)
@@ -303,12 +258,11 @@ static const char* const kOrtSessionOptionEpContextEnable = "ep.context_enable";
// Specify the file path for the Onnx model which has EP context.
// Default to original_file_name_ctx.onnx if not specified
// Folder is not a valid option
static const char* const kOrtSessionOptionEpContextFilePath = "ep.context_file_path";
// Flag to specify whether to dump the EP context into the Onnx model.
// "0": dump the EP context into separate file, keep the file name in the Onnx model. (default).
// "1": dump the EP context into the Onnx model.
// "0": dump the EP context into separate file, keep the file name in the Onnx model.
// "1": dump the EP context into the Onnx model. (default).
static const char* const kOrtSessionOptionEpContextEmbedMode = "ep.context_embed_mode";
// Specify the EPContext node name prefix to make it unique
@@ -318,11 +272,6 @@ static const char* const kOrtSessionOptionEpContextNodeNamePrefix = "ep.context_
// Share EP related resources across EPs
static const char* const kOrtSessionOptionShareEpContexts = "ep.share_ep_contexts";
// Use this config when dumping EP context model with an external initializers file
// All initializers will be inside the external data file if specified, otherwise all in Onnx file
static const char* const kOrtSessionOptionsEpContextModelExternalInitializersFileName =
"ep.context_model_external_initializers_file_name";
// Gemm fastmath mode provides fp32 gemm acceleration with bfloat16 based matmul.
// Option values:
// - "0": Gemm FastMath mode is not enabled. [DEFAULT]

BIN (stored with Git LFS; binary files not shown):

libs/onnxruntime/lib/msys2/onnxruntime.dll
libs/onnxruntime/lib/msys2/onnxruntime.lib
libs/onnxruntime/lib/msys2/onnxruntime_providers_cuda.dll
libs/onnxruntime/lib/msys2/onnxruntime_providers_cuda.lib
libs/onnxruntime/lib/msys2/onnxruntime_providers_shared.dll
libs/onnxruntime/lib/msys2/onnxruntime_providers_shared.lib
libs/onnxruntime/lib/msys2/onnxruntime_providers_tensorrt.dll
libs/onnxruntime/lib/msys2/onnxruntime_providers_tensorrt.lib

179
src/ofxOnnxRuntime.cpp

@@ -1,5 +1,4 @@
#include "ofxOnnxRuntime.h"
#include "ofMain.h"
namespace ofxOnnxRuntime
{
@@ -15,9 +14,12 @@ namespace ofxOnnxRuntime
return wstr;
}
#endif
void BaseHandler::setup(const std::string & onnx_path, const BaseSetting & base_setting, const std::vector<int64_t>& batched_dims, const int & batch_size)
void BaseHandler::setup(const std::string & onnx_path, const BaseSetting & base_setting, const int & batch_size, const bool debug, const bool timestamp)
{
// Store data types
this->input_dtype = base_setting.input_dtype;
this->output_dtype = base_setting.output_dtype;
Ort::SessionOptions session_options;
session_options.SetIntraOpNumThreads(1);
session_options.SetIntraOpNumThreads(1);
@@ -32,9 +34,9 @@ namespace ofxOnnxRuntime
session_options.AppendExecutionProvider_CUDA(opts);
}
// Sets batch size
this->timestamp = timestamp;
this->debug = debug;
this->batch_size = batch_size;
this->batched_dims = batched_dims;
this->setup2(onnx_path, session_options);
}
@@ -46,7 +48,11 @@ namespace ofxOnnxRuntime
ort_session = std::make_shared<Ort::Session>(ort_env, wpath.c_str(), session_options);
setNames();
}
void BaseHandler::setNames()
{
Ort::AllocatorWithDefaultOptions allocator;
// 1. Gets Input Name/s & Shape ([1, 3, 28, 28]) -- In most cases this is usually just one
@@ -55,22 +61,17 @@ namespace ofxOnnxRuntime
input_node_dims = ort_session->GetInputTypeInfo(i).GetTensorTypeAndShapeInfo().GetShape();
// Some models might have negative shape values to indicate dynamic shape, e.g., for variable batch size. (?, 3, 28, 28) -> (1, 3, 28, 28)
for (auto& s : input_node_dims) if (s < 0) s = 1;
for (auto& s : input_node_dims) if (s < 0) s = batch_size;
std::cout << input_node_names.at(i) << " : " << PrintShape(input_node_dims) << std::endl;
if (debug) std::cout << input_node_names.at(i) << " : " << PrintShape(input_node_dims) << std::endl;
}
// 2. Calculate the product of the dimensions
for (auto& f : batched_dims) {
for (auto& f : input_node_dims) {
input_node_size *= f;
}
// 3. Resize input values array to match input tensor/s
input_values_handler.resize(batch_size);
for (auto& tensor : input_values_handler) {
tensor.resize(input_node_size);
}
if (debug) ofLog() << ofToString(input_node_size) + ", Batch Size:" + ofToString(input_node_dims[0]);
// 2. Clear up output values
output_node_dims.clear();
@@ -83,27 +84,53 @@ namespace ofxOnnxRuntime
output_values.emplace_back(nullptr);
std::cout << output_node_names.at(i) << " : " << PrintShape(output_shapes) << std::endl;
if (debug) std::cout << output_node_names.at(i) << " : " << PrintShape(output_shapes) << std::endl;
}
}
std::vector<Ort::Value>& BaseHandler::run()
float* BaseHandler::run()
{
auto start = std::chrono::high_resolution_clock::now(); // starting timestamp
std::vector<Ort::Value> input_tensors;
size_t num_images = input_imgs.size();
if(input_imgs.size() != batch_size) {
ofLog() << "Input images do not match batch size. Inference FAILED.";
return dummy_output_tensor.front().GetTensorMutableData<float>();
}
// 1. Create 1-D array for all values to create tensor & push all values from input_vals to batch_vals
std::vector<float> batch_values(input_node_size * batch_size);
std::vector<float> batch_values;
batch_values.resize(input_node_size * batch_size); // Reserve space but don't initialize
for (const auto& inner_vec : input_values_handler) {
for (float value : inner_vec) {
batch_values.push_back(value);
std::vector<int32_t> batch_values_int;
batch_values_int.resize(input_node_size * batch_size); // Reserve space but don't initialize
if (input_dtype == ModelDataType::FLOAT32){
// I have a list of imgs, these need to be converted from images into input for the model (int or float)
for(size_t i = 0; i < batch_size; i++) {
convertImageToMatFloat(input_imgs[i], batch_values, i);
}
// 2. Create tensor with batch values { input data, input size, model input dims, model input size}
input_tensors.emplace_back(Ort::Value::CreateTensor<float>(
memory_info_handler, batch_values.data(), input_node_size,
input_node_dims.data(), input_node_dims.size()));
}
else if (input_dtype == ModelDataType::INT32) {
// I have a list of imgs, these need to be converted from images into input for the model (int or float)
for(size_t i = 0; i < batch_size; i++) {
convertImageToMatInt32(input_imgs[i], batch_values_int, i);
}
// 2. Create tensor with batch values { input data, input size, model input dims, model input size}
input_tensors.emplace_back(Ort::Value::CreateTensor<float>(
memory_info_handler, batch_values.data(), input_node_size,
// 2. Create tensor with batch values { input data, input size, model input dims, model input size}
input_tensors.emplace_back(Ort::Value::CreateTensor<int32_t>(
memory_info_handler, batch_values_int.data(), input_node_size,
input_node_dims.data(), input_node_dims.size()));
}
// transform std::string -> const char*
std::vector<const char*> input_names_char(input_node_names.size(), nullptr);
@@ -114,6 +141,11 @@ namespace ofxOnnxRuntime
std::transform(std::begin(output_node_names), std::end(output_node_names), std::begin(output_names_char),
[&](const std::string& str) { return str.c_str(); });
// Before running the model, check if we have data
if (input_dtype == ModelDataType::INT32 && batch_values_int.empty()) {
ofLog() << "Error: INT32 batch values vector is empty";
return dummy_output_tensor.front().GetTensorMutableData<float>();
}
try {
// 3. Run inference, { in names, input data, num of inputs, output names, num of outputs }
@@ -122,13 +154,103 @@ namespace ofxOnnxRuntime
input_names_char.size(), output_names_char.data(),
output_names_char.size());
return output_values;
}
catch (const Ort::Exception& ex) {
if (debug) {
// Gets the address of the first value
auto& out = output_values.front();
// Get tensor shape information
Ort::TensorTypeAndShapeInfo info = out.GetTensorTypeAndShapeInfo();
std::vector<int64_t> output_dims = info.GetShape();
// Print the dimensions
std::cout << "Output tensor dimensions: [";
for (size_t i = 0; i < output_dims.size(); i++) {
std::cout << output_dims[i];
if (i < output_dims.size() - 1) {
std::cout << ", ";
}
}
std::cout << "]" << std::endl;
// Optional: Print total number of elements
size_t total_elements = 1;
for (auto& dim : output_dims) {
if (dim > 0) { // Handle dynamic dimensions
total_elements *= static_cast<size_t>(dim);
}
}
std::cout << "Total elements: " << total_elements << std::endl;
}
if (timestamp) {
auto end = std::chrono::high_resolution_clock::now();
std::chrono::duration<double, std::milli> elapsed = end - start;
std::cout << "Update loop took " << elapsed.count() << " ms" << std::endl;
}
return output_values.front().GetTensorMutableData<float>();
} catch (const Ort::Exception& ex) {
std::cout << "ERROR running model inference: " << ex.what() << std::endl;
return dummy_output_tensor;
return dummy_output_tensor.front().GetTensorMutableData<float>();
}
}
/*
*
* Utilities
*
*/
// Add separate methods for float and int32 conversion
void BaseHandler::convertImageToMatFloat(ofImage* img, std::vector<float>& values, size_t& idx) {
// Your existing conversion code for float
ofPixels& pix = img->getPixels();
int width = img->getWidth();
int height = img->getHeight();
int channels = pix.getNumChannels();
cv::Mat cvImage = cv::Mat(height, width, (channels == 3) ? CV_8UC3 : CV_8UC1, pix.getData());
cv::InputArray inputArray(cvImage);
image_array = cv::dnn::blobFromImage(inputArray, 1 / 255.0, cv::Size(input_node_dims[2], input_node_dims[3]), (0, 0, 0), false, false);
std::memcpy(
values.data() + idx * channels * width * height,
image_array.data,
channels * width * height * sizeof(float)
);
}
void BaseHandler::convertImageToMatInt32(ofImage* img, std::vector<int32_t>& values, size_t& idx) {
ofPixels& pix = img->getPixels();
int width = img->getWidth();
int height = img->getHeight();
int channels = pix.getNumChannels();
cv::Mat cvImage = cv::Mat(height, width, (channels == 3) ? CV_8UC3 : CV_8UC1, pix.getData());
// Create blob with the correct dimensions
cv::Mat floatMat = cv::dnn::blobFromImage(cvImage, 1/255.0,
cv::Size(256, 256),
cv::Scalar(0, 0, 0), false, false);
// Convert float blob to int32
cv::Mat intMat;
floatMat.convertTo(intMat, CV_32S);
// Calculate how many values we need to add
size_t elementsPerImage = channels * 256* 256;
size_t startPos = idx * elementsPerImage;
// Copy data from intMat to values
int32_t* intData = (int32_t*)intMat.data;
for (size_t i = 0; i < elementsPerImage; i++) {
values[startPos + i] = intData[i];
}
}
void BaseHandler::setInputs(std::vector<ofImage*>& in) {
this->input_imgs = in;
}
// Prints the shape of the given tensor (ex. input: (1, 1, 512, 512))
@@ -176,9 +298,6 @@ namespace ofxOnnxRuntime
}
Ort::Value BaseHandler::VectorToTensor(std::vector<float>& data, const std::vector<int64_t>& shape) {
//// Allocate memory using CPU memory allocator
//Ort::MemoryInfo mem_info = Ort::MemoryInfo::CreateCpu(OrtAllocatorType::OrtArenaAllocator, OrtMemType::OrtMemTypeDefault);
// Create a tensor from the provided data, shape, and memory info
auto tensor = Ort::Value::CreateTensor<float>(memory_info_handler, data.data(), data.size(), shape.data(), shape.size());
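The convertImageToMatFloat / convertImageToMatInt32 helpers above lean on OpenCV's blobFromImage to turn an ofImage into the NCHW buffer the input tensor is built from. Below is a stand-alone sketch of that preprocessing step, assuming OpenCV's dnn module is available; the file name and the 256x256 target size are illustrative:

#include <opencv2/dnn.hpp>
#include <opencv2/imgcodecs.hpp>

int main() {
    cv::Mat img = cv::imread("input.png");   // illustrative path, 8-bit BGR
    if (img.empty()) return 1;

    // Scale pixels to [0,1], resize to the model's expected H x W, and lay the
    // result out as a contiguous NCHW float blob of shape {1, C, H, W}.
    cv::Mat blob = cv::dnn::blobFromImage(img, 1 / 255.0, cv::Size(256, 256),
                                          cv::Scalar(0, 0, 0),
                                          /*swapRB=*/false, /*crop=*/false);

    // blob.total() == 1 * img.channels() * 256 * 256: this is the block of floats
    // the handler copies into its batched input vector before building the tensor.
    return blob.empty() ? 1 : 0;
}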

74
src/ofxOnnxRuntime.h

@@ -1,6 +1,8 @@
#pragma once
#include <onnxruntime_cxx_api.h>
#include "ofMain.h"
#include "ofxOpenCv.h"
namespace ofxOnnxRuntime
{
@@ -11,53 +13,67 @@ namespace ofxOnnxRuntime
INFER_TENSORRT
};
enum ModelDataType {
FLOAT32,
INT32
};
struct BaseSetting
{
InferType infer_type;
int device_id;
ModelDataType input_dtype = FLOAT32;
ModelDataType output_dtype = FLOAT32;
};
class BaseHandler
{
public:
BaseHandler() {}
public:
BaseHandler() {}
void setup(const std::string& onnx_path, const BaseSetting& base_setting = BaseSetting{ INFER_CPU, 0 }, const std::vector<int64_t>& batched_dims = {}, const int& batch_size = 1);
void setup2(const std::string& onnx_path, const Ort::SessionOptions& session_options);
void setup(const std::string& onnx_path, const BaseSetting& base_setting = BaseSetting{ INFER_CPU, 0, FLOAT32, FLOAT32 }, const int& batch_size = 1, const bool debug = false, const bool timestamp = false);
void setup2(const std::string& onnx_path, const Ort::SessionOptions& session_options);
void setNames();
void setInputs(std::vector<ofImage*>& input_imgs);
void convertImageToMatInt32(ofImage* img, std::vector<int32_t>& values, size_t& idx);
void convertImageToMatFloat(ofImage* img, std::vector<float>& values, size_t& idx);
float* run();
std::vector<std::vector<float>>* getInputTensorData() {
return &this->input_values_handler;
}
// Utilities ╰(‵□′)╯
std::string PrintShape(const std::vector<int64_t>& v);
Ort::Value GenerateTensor(int batch_size);
int CalculateProduct(const std::vector<int64_t>& v);
Ort::Value VectorToTensor(std::vector<float>& data, const std::vector<int64_t>& shape);
std::vector<Ort::Value>& run();
protected:
bool debug = false;
bool timestamp = false;
Ort::Env ort_env;
std::shared_ptr<Ort::Session> ort_session;
// Utilities
std::string PrintShape(const std::vector<int64_t>& v);
Ort::Value GenerateTensor(int batch_size);
int CalculateProduct(const std::vector<int64_t>& v);
Ort::Value VectorToTensor(std::vector<float>& data, const std::vector<int64_t>& shape);
std::vector<std::string> input_node_names;
std::vector<int64_t> input_node_dims; // 1 input only.
protected:
Ort::Env ort_env;
std::shared_ptr<Ort::Session> ort_session;
Ort::MemoryInfo memory_info_handler = Ort::MemoryInfo::CreateCpu(OrtArenaAllocator, OrtMemTypeDefault);
std::vector<std::string> input_node_names;
std::vector<int64_t> input_node_dims; // 1 input only.
std::vector<std::string> output_node_names;
std::vector<std::vector<int64_t>> output_node_dims; // >=1 outputs
std::vector<Ort::Value> output_values;
Ort::MemoryInfo memory_info_handler = Ort::MemoryInfo::CreateCpu(OrtArenaAllocator, OrtMemTypeDefault);
Ort::Value dummy_tensor{ nullptr };
std::vector<Ort::Value> dummy_output_tensor;
std::vector<std::string> output_node_names;
std::vector<std::vector<int64_t>> output_node_dims; // >=1 outputs
std::vector<Ort::Value> output_values;
std::vector<std::vector<float>> input_values_handler;
Ort::Value dummy_tensor{ nullptr };
std::vector<Ort::Value> dummy_output_tensor;
size_t input_node_size = 1;
std::vector<int64_t> batched_dims;
int batch_size;
int num_outputs = 1;
std::vector<std::vector<float>> input_values_handler;
std::vector<ofImage*> input_imgs;
cv::Mat image_array;
size_t input_node_size = 1;
std::vector<int64_t> batched_dims;
int batch_size;
int num_outputs = 1;
ModelDataType input_dtype;
ModelDataType output_dtype;
};
}
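Taken together, the revised header boils down to a setup / setInputs / run cycle driven by ofImage pointers. A minimal usage sketch from an openFrameworks app, assuming the API exactly as declared above; the model path, image file, and batch size of 1 are illustrative, and interpreting the returned float pointer depends on the model's output shape:

#include "ofMain.h"
#include "ofxOnnxRuntime.h"

class ofApp : public ofBaseApp {
public:
    ofxOnnxRuntime::BaseHandler model;
    ofImage img;
    std::vector<ofImage*> inputs;

    void setup() {
        img.load("frame.png");                                    // illustrative input image
        inputs.push_back(&img);

        ofxOnnxRuntime::BaseSetting settings{
            ofxOnnxRuntime::INFER_CUDA, 0,                        // provider, device id
            ofxOnnxRuntime::FLOAT32, ofxOnnxRuntime::FLOAT32 };   // input / output dtypes

        model.setup("model.onnx", settings, /*batch_size*/ 1, /*debug*/ true, /*timestamp*/ true);
        model.setInputs(inputs);
    }

    void update() {
        float* out = model.run();   // pointer into the first output tensor
        // ... read values from out according to the model's output dimensions
    }
};

int main() {
    ofSetupOpenGL(640, 480, OF_WINDOW);
    ofRunApp(new ofApp());
}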

297
temp.cpp

@@ -0,0 +1,297 @@
#include "ofxOnnxRuntime.h"
namespace ofxOnnxRuntime
{
#ifdef _MSC_VER
static std::wstring to_wstring(const std::string &str)
{
unsigned len = str.size() * 2;
setlocale(LC_CTYPE, "");
wchar_t *p = new wchar_t[len];
mbstowcs(p, str.c_str(), len);
std::wstring wstr(p);
delete[] p;
return wstr;
}
#endif
void BaseHandler::setup(const std::string & onnx_path, const BaseSetting & base_setting, const int & batch_size, const bool debug, const bool timestamp)
{
// Store data types
this->input_dtype = base_setting.input_dtype;
this->output_dtype = base_setting.output_dtype;
Ort::SessionOptions session_options;
session_options.SetIntraOpNumThreads(1);
session_options.SetIntraOpNumThreads(1);
session_options.SetGraphOptimizationLevel(GraphOptimizationLevel::ORT_ENABLE_ALL);
if (base_setting.infer_type == INFER_CUDA) {
OrtCUDAProviderOptions opts;
opts.device_id = 0;
opts.cudnn_conv_algo_search = OrtCudnnConvAlgoSearchExhaustive;
opts.do_copy_in_default_stream = 0;
opts.arena_extend_strategy = 0;
session_options.AppendExecutionProvider_CUDA(opts);
}
this->timestamp = timestamp;
this->debug = debug;
this->batch_size = batch_size;
this->setup2(onnx_path, session_options);
}
void BaseHandler::setup2(const std::string & onnx_path, const Ort::SessionOptions & session_options)
{
std::string path = ofToDataPath(onnx_path, true);
std::wstring wpath(path.begin(), path.end()); // basic conversion
ort_session = std::make_shared<Ort::Session>(ort_env, wpath.c_str(), session_options);
setNames();
}
void BaseHandler::setNames()
{
Ort::AllocatorWithDefaultOptions allocator;
// 1. Gets Input Name/s & Shape ([1, 3, 28, 28]) -- In most cases this is usually just one
for (std::size_t i = 0; i < ort_session->GetInputCount(); i++) {
input_node_names.emplace_back(ort_session->GetInputNameAllocated(i, allocator).get());
input_node_dims = ort_session->GetInputTypeInfo(i).GetTensorTypeAndShapeInfo().GetShape();
// Some models might have negative shape values to indicate dynamic shape, e.g., for variable batch size. (?, 3, 28, 28) -> (1, 3, 28, 28)
for (auto& s : input_node_dims) if (s < 0) s = batch_size;
if (debug) std::cout << input_node_names.at(i) << " : " << PrintShape(input_node_dims) << std::endl;
}
// 2. Calculate the product of the dimensions
for (auto& f : input_node_dims) {
input_node_size *= f;
}
if (debug) ofLog() << ofToString(input_node_size) + ", Batch Size:" + ofToString(input_node_dims[0]);
// 2. Clear up output values
output_node_dims.clear();
output_values.clear();
// 3. Gets Output name/s & Shapes
for (std::size_t i = 0; i < ort_session->GetOutputCount(); i++) {
output_node_names.emplace_back(ort_session->GetOutputNameAllocated(i, allocator).get());
auto output_shapes = ort_session->GetOutputTypeInfo(i).GetTensorTypeAndShapeInfo().GetShape();
output_values.emplace_back(nullptr);
if (debug) std::cout << output_node_names.at(i) << " : " << PrintShape(output_shapes) << std::endl;
}
}
float* BaseHandler::run()
{
auto start = std::chrono::high_resolution_clock::now(); // starting timestamp
std::vector<Ort::Value> input_tensors;
size_t num_images = input_imgs.size();
if(input_imgs.size() != batch_size) {
ofLog() << "Input images do not match batch size. Inference FAILED.";
return dummy_output_tensor.front().GetTensorMutableData<float>();
}
// transform std::string -> const char*
std::vector<const char*> input_names_char(input_node_names.size(), nullptr);
std::transform(std::begin(input_node_names), std::end(input_node_names), std::begin(input_names_char),
[&](const std::string& str) { return str.c_str(); });
std::vector<const char*> output_names_char(output_node_names.size(), nullptr);
std::transform(std::begin(output_node_names), std::end(output_node_names), std::begin(output_names_char),
[&](const std::string& str) { return str.c_str(); });
std::vector<float> batch_values_f;
std::vector<int32_t> batch_values_int32;
batch_values_f.reserve(input_node_size * batch_size); // Reserve space but don't initialize
batch_values_int32.reserve(input_node_size * batch_size); // Reserve space but don't initialize
if (input_dtype == ModelDataType::FLOAT32){
// I have a list of imgs, these need to be converted from images into input for the model (int or float)
for(size_t i = 0; i < batch_size; i++) {
convertImageToMatFloat(input_imgs[i], batch_values_f, i);
}
// 2. Create tensor with batch values { input data, input size, model input dims, model input size}
input_tensors.emplace_back(Ort::Value::CreateTensor<float>(
memory_info_handler, batch_values_f.data(), input_node_size,
input_node_dims.data(), input_node_dims.size()));
}
else if (input_dtype == ModelDataType::INT32) {
// I have a list of imgs, these need to be converted from images into input for the model (int or float)
for(size_t i = 0; i < batch_size; i++) {
convertImageToMatInt32(input_imgs[i], batch_values_int32, i);
}
// 2. Create tensor with batch values { input data, input size, model input dims, model input size}
input_tensors.emplace_back(Ort::Value::CreateTensor<int32_t>(
memory_info_handler, batch_values_int32.data(), input_node_size,
input_node_dims.data(), input_node_dims.size()));
}
try {
// 3. Run inference, { in names, input data, num of inputs, output names, num of outputs }
ofLog() << "run";
output_values = ort_session->Run(Ort::RunOptions{ nullptr },
input_names_char.data(), input_tensors.data(),
input_names_char.size(), output_names_char.data(),
output_names_char.size());
ofLog() << "ran";
if (debug) {
// Gets the address of the first value
auto& out = output_values.front();
// Get tensor shape information
Ort::TensorTypeAndShapeInfo info = out.GetTensorTypeAndShapeInfo();
std::vector<int64_t> output_dims = info.GetShape();
// Print the dimensions
std::cout << "Output tensor dimensions: [";
for (size_t i = 0; i < output_dims.size(); i++) {
std::cout << output_dims[i];
if (i < output_dims.size() - 1) {
std::cout << ", ";
}
}
std::cout << "]" << std::endl;
// Optional: Print total number of elements
size_t total_elements = 1;
for (auto& dim : output_dims) {
if (dim > 0) { // Handle dynamic dimensions
total_elements *= static_cast<size_t>(dim);
}
}
std::cout << "Total elements: " << total_elements << std::endl;
}
// if (timestamp) {
// auto end = std::chrono::high_resolution_clock::now();
// std::chrono::duration<double, std::milli> elapsed = end - start;
// std::cout << "Update loop took " << elapsed.count() << " ms" << std::endl;
// }
return output_values.front().GetTensorMutableData<float>();
} catch (const Ort::Exception& ex) {
std::cout << "ERROR running model inference: " << ex.what() << std::endl;
return dummy_output_tensor.front().GetTensorMutableData<float>();
}
}
/*
*
* Utilities
*
*/
// Add separate methods for float and int32 conversion
void BaseHandler::convertImageToMatFloat(ofImage* img, std::vector<float>& values, size_t& idx) {
// Your existing conversion code for float
ofPixels& pix = img->getPixels();
int width = img->getWidth();
int height = img->getHeight();
int channels = pix.getNumChannels();
cv::Mat cvImage = cv::Mat(height, width, (channels == 3) ? CV_8UC3 : CV_8UC1, pix.getData());
cv::InputArray inputArray(cvImage);
image_array = cv::dnn::blobFromImage(inputArray, 1 / 255.0, cv::Size(input_node_dims[2], input_node_dims[3]), (0, 0, 0), false, false);
std::memcpy(
values.data() + idx * channels * width * height,
image_array.data,
channels * width * height * sizeof(float)
);
}
void BaseHandler::convertImageToMatInt32(ofImage* img, std::vector<int32_t>& values, size_t& idx) {
// New conversion code for int32
ofPixels& pix = img->getPixels();
int width = img->getWidth();
int height = img->getHeight();
int channels = pix.getNumChannels();
cv::Mat cvImage = cv::Mat(height, width, (channels == 3) ? CV_8UC3 : CV_8UC1, pix.getData());
cv::InputArray inputArray(cvImage);
cv::Mat intMat = cv::dnn::blobFromImage(inputArray, 1 / 255.0, cv::Size(height, width), (0, 0, 0), false, false);
intMat.convertTo(image_array, CV_32S);
std::memcpy(
values.data() + idx * channels * width * height,
image_array.data,
channels * width * height * sizeof(int32_t)
);
}
void BaseHandler::setInputs(std::vector<ofImage*>& in) {
this->input_imgs = in;
}
// Prints the shape of the given tensor (ex. input: (1, 1, 512, 512))
std::string BaseHandler::PrintShape(const std::vector<int64_t>& v) {
std::stringstream ss;
for (std::size_t i = 0; i < v.size() - 1; i++) ss << v[i] << "x";
ss << v[v.size() - 1];
return ss.str();
}
Ort::Value BaseHandler::GenerateTensor(int batch_size) {
// Random number generation setup
std::random_device rd;
std::mt19937 gen(rd());
std::uniform_real_distribution<float> dis(0.0f, 255.0f); // Random values between 0 and 255
// Calculate the total number of elements for a single tensor (without batch dimension) {?, 8} -> 8
int tensor_size = CalculateProduct(input_node_dims);
// Create a vector to hold all the values for the batch (8 * (4)batch_size) -> 32
std::vector<float> batch_values(batch_size * tensor_size);
// Fill the batch with random values
std::generate(batch_values.begin(), batch_values.end(), [&]() {
return dis(gen);
});
// Fill the batch with random values
std::generate(batch_values.begin(), batch_values.end(), [&]() {
return dis(gen);
});
// Create the batched dimensions by inserting the batch size at the beginning of the original dimensions
std::vector<int64_t> batched_dims = { }; // Start with batch size
batched_dims.insert(batched_dims.end(), input_node_dims.begin(), input_node_dims.end()); // Add the remaining dimensions
batched_dims[0] = batch_size;
return VectorToTensor(batch_values, batched_dims);
}
int BaseHandler::CalculateProduct(const std::vector<int64_t>& v) {
int total = 1;
for (auto& i : v) total *= i;
return total;
}
Ort::Value BaseHandler::VectorToTensor(std::vector<float>& data, const std::vector<int64_t>& shape) {
// Create a tensor from the provided data, shape, and memory info
auto tensor = Ort::Value::CreateTensor<float>(memory_info_handler, data.data(), data.size(), shape.data(), shape.size());
// Return the created tensor
return tensor;
}
}