Switch the base to ort v2.0.0-rc.1
qryxip committed Apr 28, 2024
1 parent b147977 commit fc968d1
Showing 4 changed files with 50 additions and 60 deletions.
86 changes: 42 additions & 44 deletions Cargo.lock

Some generated files are not rendered by default.

2 changes: 1 addition & 1 deletion Cargo.toml
@@ -88,7 +88,7 @@ zip = "0.6.3"
 
 [workspace.dependencies.voicevox-ort]
 git = "https://github.com/qryxip/ort.git"
-rev = "37af007322f0dd5a21e536ab3bcf727970f1283a"
+rev = "59e94ac87732e9da3f83ebbd542a3062f3cf2264"
 
 [workspace.dependencies.open_jtalk]
 git = "https://github.com/VOICEVOX/open_jtalk-rs.git"
1 change: 1 addition & 0 deletions crates/voicevox_core/src/infer.rs
@@ -79,6 +79,7 @@ pub(crate) trait InferenceInputSignature: Send + 'static {
 pub(crate) trait InputScalar: Sized {
     const KIND: InputScalarKind;
 
+    // TODO: It may be possible to take an `ArrayView` instead of an `Array`
     fn push_tensor_to_ctx(
         tensor: Array<Self, impl Dimension + 'static>,
         visitor: &mut impl PushInputTensor,
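For context on the TODO added above, here is a minimal sketch of what a borrowing variant could look like, assuming ndarray's `ArrayView`; the `PushInputTensor` trait shown is a stand-in for the crate's actual visitor trait, not its real definition:

use ndarray::{ArrayView, Dimension};

// Stand-in for the crate's visitor trait; the real `PushInputTensor`
// has one method per supported element type.
trait PushInputTensor {
    fn push_f32(&mut self, tensor: ArrayView<'_, f32, impl Dimension>);
}

// Hypothetical borrowing variant of `push_tensor_to_ctx`: taking a view
// would let callers avoid cloning tensor data into an owned `Array` first.
trait InputScalar: Sized {
    fn push_tensor_to_ctx(
        tensor: ArrayView<'_, Self, impl Dimension>,
        visitor: &mut impl PushInputTensor,
    );
}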
21 changes: 6 additions & 15 deletions crates/voicevox_core/src/infer/runtimes/onnxruntime.rs
@@ -8,7 +8,6 @@ use ort::{
     ExecutionProviderDispatch, GraphOptimizationLevel, IntoTensorElementType, TensorElementType,
     ValueType,
 };
-use tracing::warn;
 
 use crate::{devices::SupportedDevices, error::ErrorRepr};
 
@@ -56,17 +55,9 @@ impl InferenceRuntime for Onnxruntime {
         // TODO: Create `InferenceRuntime::init` and `InitInferenceRuntimeError`
         build_ort_env_once().unwrap();
 
-        let cpu_num_threads = options.cpu_num_threads.try_into().unwrap_or_else(|_| {
-            warn!(
-                "`cpu_num_threads={}` is too large. Setting it to 32767",
-                options.cpu_num_threads,
-            );
-            i16::MAX
-        });
-
         let builder = ort::Session::builder()?
             .with_optimization_level(GraphOptimizationLevel::Level1)?
-            .with_intra_threads(cpu_num_threads)?;
+            .with_intra_threads(options.cpu_num_threads.into())?;
 
         let builder = if options.use_gpu && cfg!(feature = "directml") {
             builder
Expand All @@ -84,7 +75,7 @@ impl InferenceRuntime for Onnxruntime {
};

let model = model()?;
let sess = builder.with_model_from_memory(&{ model })?;
let sess = builder.commit_from_memory(&{ model })?;

let input_param_infos = sess
.inputs
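Taken together, the two builder changes above track the rc.1 API: `with_model_from_memory` was renamed to `commit_from_memory`, and `with_intra_threads` now accepts a wider integer, which makes the old clamp to `i16::MAX` (and the `warn!` about it) unnecessary. A minimal sketch of the resulting construction path, assuming ort 2.0.0-rc.1 and omitting the GPU branches:

use ort::{GraphOptimizationLevel, Session};

fn build_session(model: &[u8], cpu_num_threads: u16) -> ort::Result<Session> {
    // `with_intra_threads` takes a plain `usize` here, so a `u16` thread
    // count converts losslessly; no clamping needed.
    Session::builder()?
        .with_optimization_level(GraphOptimizationLevel::Level1)?
        .with_intra_threads(cpu_num_threads.into())?
        // Renamed from `with_model_from_memory` in earlier ort 2.0 builds.
        .commit_from_memory(model)
}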
@@ -187,8 +178,8 @@
 
         match ty {
             TensorElementType::Float32 => {
-                let output = output.extract_tensor::<f32>()?;
-                Ok(OutputTensor::Float32(output.view().clone().into_owned()))
+                let output = output.try_extract_tensor::<f32>()?;
+                Ok(OutputTensor::Float32(output.into_owned()))
             }
             _ => bail!("unexpected output tensor element data type"),
         }
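In rc.1, `try_extract_tensor` yields a borrowed `ArrayView` rather than an owning wrapper, which is why the extra `view().clone()` above collapses into a single `into_owned()`. A minimal sketch of the extraction, assuming ort 2.0.0-rc.1 with its ndarray integration enabled:

use ndarray::ArrayD;

// Extract an owned f32 tensor from an ort output value. `try_extract_tensor`
// borrows from `value`, so `into_owned` copies the data out.
fn extract_f32(value: &ort::Value) -> anyhow::Result<ArrayD<f32>> {
    let view = value.try_extract_tensor::<f32>()?;
    Ok(view.into_owned())
}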
@@ -205,7 +196,7 @@ fn build_ort_env_once() -> ort::Result<()> {
 
 pub(crate) struct OnnxruntimeRunContext<'sess> {
     sess: &'sess ort::Session,
-    inputs: Vec<ort::SessionInputValue<'static>>,
+    inputs: Vec<ort::SessionInputValue<'static>>,
 }
 
 impl OnnxruntimeRunContext<'_> {
@@ -216,7 +207,7 @@ impl OnnxruntimeRunContext<'_> {
             impl Dimension + 'static,
         >,
     ) -> anyhow::Result<()> {
-        let input = input.try_into()?;
+        let input = ort::Value::from_array(input)?.into();
         self.inputs.push(input);
         Ok(())
     }
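A minimal sketch of the new input path, mirroring the change above: an owned `ndarray::Array` goes through `ort::Value::from_array`, and the result converts via `into()` to the `SessionInputValue` that the session consumes (assuming ort 2.0.0-rc.1):

use ndarray::ArrayD;

// Wrap an owned dynamic-dimension array as a session input value.
fn to_session_input(array: ArrayD<f32>) -> ort::Result<ort::SessionInputValue<'static>> {
    Ok(ort::Value::from_array(array)?.into())
}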
