Added DML and CUDA provider support in onnxruntime-node #16050

Merged: 20 commits, Aug 25, 2023
18 changes: 17 additions & 1 deletion cmake/onnxruntime_nodejs.cmake
@@ -60,6 +60,20 @@ else()
endif()
endif()

# setup providers
if (onnxruntime_USE_CUDA)
set(NODEJS_BINDING_USE_CUDA "--use_cuda")
endif()
if (onnxruntime_USE_DML)
set(NODEJS_BINDING_USE_DML "--use_dml")
endif()
if (onnxruntime_USE_TENSORRT)
set(NODEJS_BINDING_USE_TENSORRT "--use_tensorrt")
endif()
if (onnxruntime_USE_COREML)
set(NODEJS_BINDING_USE_COREML "--use_coreml")
endif()

if(NOT onnxruntime_ENABLE_STATIC_ANALYSIS)
# add custom target
add_custom_target(js_npm_ci ALL
@@ -74,7 +88,9 @@ add_custom_target(js_common_npm_ci ALL

add_custom_target(nodejs_binding_wrapper ALL
COMMAND ${NPM_CLI} ci
COMMAND ${NPM_CLI} run build -- --onnxruntime-build-dir=${CMAKE_CURRENT_BINARY_DIR} --config=${CMAKE_BUILD_TYPE} --arch=${NODEJS_BINDING_ARCH}
COMMAND ${NPM_CLI} run build -- --onnxruntime-build-dir=${CMAKE_CURRENT_BINARY_DIR} --config=${CMAKE_BUILD_TYPE}
--arch=${NODEJS_BINDING_ARCH} ${NODEJS_BINDING_USE_CUDA} ${NODEJS_BINDING_USE_DML} ${NODEJS_BINDING_USE_TENSORRT}
${NODEJS_BINDING_USE_COREML}
WORKING_DIRECTORY ${JS_NODE_ROOT}
COMMENT "Using cmake-js to build OnnxRuntime Node.js binding")

16 changes: 15 additions & 1 deletion js/common/lib/inference-session.ts
@@ -170,12 +170,14 @@ export declare namespace InferenceSession {
// Backend React Native: supports 'cpu', 'xnnpack', 'coreml' (iOS), 'nnapi' (Android).
interface ExecutionProviderOptionMap {
cpu: CpuExecutionProviderOption;
coreml: CoreMlExecutionProviderOption;
cuda: CudaExecutionProviderOption;
dml: DmlExecutionProviderOption;
tensorrt: TensorRtExecutionProviderOption;
wasm: WebAssemblyExecutionProviderOption;
webgl: WebGLExecutionProviderOption;
xnnpack: XnnpackExecutionProviderOption;
webnn: WebNNExecutionProviderOption;
coreml: CoreMLExecutionProviderOption;
nnapi: NnapiExecutionProviderOption;
}

@@ -194,6 +196,18 @@ export declare namespace InferenceSession {
readonly name: 'cuda';
deviceId?: number;
}
export interface CoreMlExecutionProviderOption extends ExecutionProviderOption {
readonly name: 'coreml';
coreMlFlags?: number;
}
export interface DmlExecutionProviderOption extends ExecutionProviderOption {
readonly name: 'dml';
deviceId?: number;
}
export interface TensorRtExecutionProviderOption extends ExecutionProviderOption {
readonly name: 'tensorrt';
deviceId?: number;
}
export interface WebAssemblyExecutionProviderOption extends ExecutionProviderOption {
readonly name: 'wasm';
}
29 changes: 29 additions & 0 deletions js/node/CMakeLists.txt
@@ -28,8 +28,29 @@ endif()
# include dirs
include_directories(${CMAKE_JS_INC})
include_directories(${CMAKE_SOURCE_DIR}/../../include/onnxruntime/core/session)
include_directories(${CMAKE_SOURCE_DIR}/../../include/onnxruntime)
include_directories(${CMAKE_SOURCE_DIR}/../../onnxruntime)
include_directories(${CMAKE_SOURCE_DIR}/node_modules/node-addon-api)

# optional providers
option(USE_DML "Build with DirectML support" OFF)
option(USE_CUDA "Build with CUDA support" OFF)
option(USE_TENSORRT "Build with TensorRT support" OFF)
option(USE_COREML "Build with CoreML support" OFF)

if(USE_DML)
add_compile_definitions(USE_DML=1)
endif()
if(USE_CUDA)
add_compile_definitions(USE_CUDA=1)
endif()
if(USE_TENSORRT)
add_compile_definitions(USE_TENSORRT=1)
endif()
if(USE_COREML)
add_compile_definitions(USE_COREML=1)
endif()

# source files
file(GLOB ORT_NODEJS_BINDING_SOURCE_FILES ${CMAKE_SOURCE_DIR}/src/*.cc)

@@ -77,6 +98,14 @@ if (WIN32)
${ONNXRUNTIME_BUILD_DIR}/${CMAKE_BUILD_TYPE}/onnxruntime.dll
${dist_folder}
)
if (USE_DML)
add_custom_command(
TARGET onnxruntime_binding POST_BUILD
COMMAND ${CMAKE_COMMAND} -E copy
${ONNXRUNTIME_BUILD_DIR}/${CMAKE_BUILD_TYPE}/DirectML.dll
${dist_folder}
)
endif ()
if (CMAKE_BUILD_TYPE STREQUAL "Debug")
add_custom_command(
TARGET onnxruntime_binding POST_BUILD
4 changes: 4 additions & 0 deletions js/node/README.md
@@ -24,6 +24,10 @@ Following platforms are supported with pre-built binaries:

To use on platforms without pre-built binaries, you can build the Node.js binding from source and consume it via `npm install <onnxruntime_repo_root>/js/node/`. See also the [instructions](https://www.onnxruntime.ai/docs/how-to/build.html#apis-and-language-bindings) for building the ONNX Runtime Node.js binding locally.

## GPU Support

Currently, the Windows build supports only the DirectML (DML) execution provider, while the Linux x64 build can use the CUDA and TensorRT providers.
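
As a rough illustration (not part of this change), a session could request one of these providers at creation time. The snippet below is a sketch that assumes the binding was built with the corresponding provider enabled; `model.onnx` and `deviceId: 0` are placeholders.

```ts
import { InferenceSession } from 'onnxruntime-node';

// Sketch: prefer DirectML on Windows and CUDA elsewhere, keeping CPU as the fallback.
// Requesting a provider the binary was not built with throws at session creation.
async function createSession(): Promise<InferenceSession> {
  const gpu = process.platform === 'win32'
      ? { name: 'dml' as const, deviceId: 0 }   // DirectML (Windows)
      : { name: 'cuda' as const, deviceId: 0 }; // CUDA (Linux x64)
  return InferenceSession.create('model.onnx', {
    executionProviders: [gpu, 'cpu'],
  });
}
```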

## License

License information can be found [here](https://github.com/microsoft/onnxruntime/blob/main/README.md#license).
1 change: 1 addition & 0 deletions js/node/lib/backend.ts
@@ -69,3 +69,4 @@ class OnnxruntimeBackend implements Backend {
}

export const onnxruntimeBackend = new OnnxruntimeBackend();
export const listSupportedBackends = binding.listSupportedBackends;
13 changes: 10 additions & 3 deletions js/node/lib/binding.ts
@@ -33,11 +33,18 @@ export declare namespace Binding {
export interface InferenceSessionConstructor {
new(): InferenceSession;
}

export interface SupportedBackend {
name: string;
bundled: boolean;
}
}

// export native binding
export const binding =
// eslint-disable-next-line @typescript-eslint/no-require-imports, @typescript-eslint/no-var-requires
require(`../bin/napi-v3/${process.platform}/${process.arch}/onnxruntime_binding.node`) as
// eslint-disable-next-line @typescript-eslint/naming-convention
{InferenceSession: Binding.InferenceSessionConstructor};
require(`../bin/napi-v3/${process.platform}/${process.arch}/onnxruntime_binding.node`) as {
// eslint-disable-next-line @typescript-eslint/naming-convention
InferenceSession: Binding.InferenceSessionConstructor;
listSupportedBackends: () => Binding.SupportedBackend[];
};
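
A possible usage sketch (not from this PR): since `listSupportedBackends` is re-exported from the package entry point later in this diff, a caller could inspect which providers the installed binary was built with and whether their native libraries are bundled.

```ts
import { listSupportedBackends } from 'onnxruntime-node';

// Each entry names a backend and reports whether its native library ships inside the package.
// Per this PR, 'cuda' and 'tensorrt' report bundled: false, so their shared libraries
// must already be installed on the system.
for (const { name, bundled } of listSupportedBackends()) {
  console.log(`${name}: ${bundled ? 'bundled' : 'requires externally installed libraries'}`);
}
```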
8 changes: 6 additions & 2 deletions js/node/lib/index.ts
@@ -2,10 +2,14 @@
// Licensed under the MIT License.

export * from 'onnxruntime-common';
export {listSupportedBackends} from './backend';
import {registerBackend, env} from 'onnxruntime-common';
import {onnxruntimeBackend} from './backend';
import {version} from './version';
import {onnxruntimeBackend, listSupportedBackends} from './backend';

registerBackend('cpu', onnxruntimeBackend, 100);
const backends = listSupportedBackends();
for (const backend of backends) {
registerBackend(backend.name, onnxruntimeBackend, 100);
}

env.versions.node = version;
20 changes: 20 additions & 0 deletions js/node/script/build.ts
@@ -25,6 +25,14 @@ if (ARCH !== 'x64' && ARCH !== 'ia32' && ARCH !== 'arm64' && ARCH !== 'arm') {
const ONNXRUNTIME_BUILD_DIR = buildArgs['onnxruntime-build-dir'];
// --rebuild
const REBUILD = !!buildArgs.rebuild;
// --use_dml
const USE_DML = !!buildArgs.use_dml;
// --use_cuda
const USE_CUDA = !!buildArgs.use_cuda;
// --use_tensorrt
const USE_TENSORRT = !!buildArgs.use_tensorrt;
// --use_coreml
const USE_COREML = !!buildArgs.use_coreml;

// build path
const ROOT_FOLDER = path.join(__dirname, '..');
@@ -47,6 +55,18 @@ const args = [
if (ONNXRUNTIME_BUILD_DIR && typeof ONNXRUNTIME_BUILD_DIR === 'string') {
args.push(`--CDONNXRUNTIME_BUILD_DIR=${ONNXRUNTIME_BUILD_DIR}`);
}
if (USE_DML) {
args.push('--CDUSE_DML=ON');
}
if (USE_CUDA) {
args.push('--CDUSE_CUDA=ON');
}
if (USE_TENSORRT) {
args.push('--CDUSE_TENSORRT=ON');
}
if (USE_COREML) {
args.push('--CDUSE_COREML=ON');
}

// set CMAKE_OSX_ARCHITECTURES for macOS build
if (os.platform() === 'darwin') {
37 changes: 37 additions & 0 deletions js/node/src/directml_load_helper.cc
@@ -0,0 +1,37 @@
// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT License.

#ifdef _WIN32
#include "common.h"
#include "windows.h"

void LoadDirectMLDll(Napi::Env env) {
DWORD pathLen = MAX_PATH;
std::wstring path(pathLen, L'\0');
HMODULE moduleHandle = nullptr;

GetModuleHandleEx(GET_MODULE_HANDLE_EX_FLAG_FROM_ADDRESS | GET_MODULE_HANDLE_EX_FLAG_UNCHANGED_REFCOUNT,
reinterpret_cast<LPCSTR>(&LoadDirectMLDll), &moduleHandle);

DWORD getModuleFileNameResult = GetModuleFileNameW(moduleHandle, const_cast<wchar_t *>(path.c_str()), pathLen);
while (getModuleFileNameResult == 0 || getModuleFileNameResult == pathLen) {
int ret = GetLastError();
if (ret == ERROR_INSUFFICIENT_BUFFER && pathLen < 32768) {
pathLen *= 2;
path.resize(pathLen);
getModuleFileNameResult = GetModuleFileNameW(moduleHandle, const_cast<wchar_t *>(path.c_str()), pathLen);
} else {
ORT_NAPI_THROW_ERROR(env, "Failed getting path to load DirectML.dll, error code: ", ret);
}
}

path.resize(path.rfind(L'\\') + 1);
path.append(L"DirectML.dll");
HMODULE libraryLoadResult = LoadLibraryW(path.c_str());

if (!libraryLoadResult) {
int ret = GetLastError();
ORT_NAPI_THROW_ERROR(env, "Failed loading bundled DirectML.dll, error code: ", ret);
}
}
#endif
6 changes: 6 additions & 0 deletions js/node/src/directml_load_helper.h
@@ -0,0 +1,6 @@
// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT License.

#if defined(USE_DML) && defined(_WIN32)
void LoadDirectMLDll(Napi::Env env);
#endif
46 changes: 43 additions & 3 deletions js/node/src/inference_session_wrap.cc
@@ -4,14 +4,19 @@
#include "onnxruntime_cxx_api.h"

#include "common.h"
#include "directml_load_helper.h"
#include "inference_session_wrap.h"
#include "run_options_helper.h"
#include "session_options_helper.h"
#include "tensor_helper.h"
#include <string>

Napi::FunctionReference InferenceSessionWrap::constructor;

Napi::Object InferenceSessionWrap::Init(Napi::Env env, Napi::Object exports) {
#if defined(USE_DML) && defined(_WIN32)
LoadDirectMLDll(env);
#endif
// create ONNX runtime env
Ort::InitApi();
ORT_NAPI_THROW_ERROR_IF(
@@ -32,6 +37,10 @@ Napi::Object InferenceSessionWrap::Init(Napi::Env env, Napi::Object exports) {
constructor = Napi::Persistent(func);
constructor.SuppressDestruct();
exports.Set("InferenceSession", func);

Napi::Function listSupportedBackends = Napi::Function::New(env, InferenceSessionWrap::ListSupportedBackends);
exports.Set("listSupportedBackends", listSupportedBackends);

return exports;
}

@@ -70,7 +79,7 @@ Napi::Value InferenceSessionWrap::LoadModel(const Napi::CallbackInfo &info) {
int64_t bytesOffset = info[1].As<Napi::Number>().Int64Value();
int64_t bytesLength = info[2].As<Napi::Number>().Int64Value();

ParseSessionOptions(info[1].As<Napi::Object>(), sessionOptions);
ParseSessionOptions(info[3].As<Napi::Object>(), sessionOptions);
this->session_.reset(new Ort::Session(*env.GetInstanceData<Ort::Env>(),
reinterpret_cast<char *>(buffer) + bytesOffset, bytesLength,
sessionOptions));
@@ -154,14 +163,15 @@ Napi::Value InferenceSessionWrap::Run(const Napi::CallbackInfo &info) {
std::vector<bool> reuseOutput;
size_t inputIndex = 0;
size_t outputIndex = 0;
OrtMemoryInfo *memory_info = Ort::MemoryInfo::CreateCpu(OrtArenaAllocator, OrtMemTypeDefault).release();

try {
for (auto &name : inputNames_) {
if (feed.Has(name)) {
inputIndex++;
inputNames_cstr.push_back(name.c_str());
auto value = feed.Get(name);
inputValues.push_back(NapiValueToOrtValue(env, value));
inputValues.push_back(NapiValueToOrtValue(env, value, memory_info));
}
}
for (auto &name : outputNames_) {
@@ -170,7 +180,7 @@ Napi::Value InferenceSessionWrap::Run(const Napi::CallbackInfo &info) {
outputNames_cstr.push_back(name.c_str());
auto value = fetch.Get(name);
reuseOutput.push_back(!value.IsNull());
outputValues.emplace_back(value.IsNull() ? Ort::Value{nullptr} : NapiValueToOrtValue(env, value));
outputValues.emplace_back(value.IsNull() ? Ort::Value{nullptr} : NapiValueToOrtValue(env, value, memory_info));
}
}

@@ -198,3 +208,33 @@
ORT_NAPI_THROW_ERROR(env, e.what());
}
}

Napi::Value InferenceSessionWrap::ListSupportedBackends(const Napi::CallbackInfo &info) {
Napi::Env env = info.Env();
Napi::EscapableHandleScope scope(env);
Napi::Array result = Napi::Array::New(env);

auto createObject = [&env](const std::string &name, const bool bundled) -> Napi::Object {
Napi::Object result = Napi::Object::New(env);
result.Set("name", name);
result.Set("bundled", bundled);
return result;
};

result.Set(uint32_t(0), createObject("cpu", true));

#ifdef USE_DML
result.Set(result.Length(), createObject("dml", true));
#endif
#ifdef USE_CUDA
result.Set(result.Length(), createObject("cuda", false));
#endif
#ifdef USE_TENSORRT
result.Set(result.Length(), createObject("tensorrt", false));
#endif
#ifdef USE_COREML
result.Set(result.Length(), createObject("coreml", true));
#endif

return scope.Escape(result);
}
6 changes: 6 additions & 0 deletions js/node/src/inference_session_wrap.h
@@ -15,6 +15,12 @@ class InferenceSessionWrap : public Napi::ObjectWrap<InferenceSessionWrap> {
InferenceSessionWrap(const Napi::CallbackInfo &info);

private:
/**
* [sync] list supported backends
* @returns array of objects like { "name": "cpu", "bundled": true }
*/
static Napi::Value ListSupportedBackends(const Napi::CallbackInfo &info);

/**
* [sync] create the session.
* @param arg0 either a string (file path) or a Uint8Array