diff --git a/Cargo.lock b/Cargo.lock index 338cdda43..2baa09fc0 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -117,7 +117,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "3fa490e751f3878eb9accb9f18988eca52c2337ce000a8bf31ef50d4c723ca9e" dependencies = [ "android_log-sys", - "env_logger 0.10.0", + "env_logger", "log", "once_cell", ] @@ -415,15 +415,13 @@ checksum = "8a32fd6af2b5827bce66c29053ba0e7c42b9dcab01835835058558c10851a46b" [[package]] name = "bindgen" -version = "0.60.1" +version = "0.62.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "062dddbc1ba4aca46de6338e2bf87771414c335f7b2f2036e8f3e9befebf88e6" +checksum = "c6720a8b7b2d39dd533285ed438d458f65b31b5c257e6ac7bb3d7e82844dd722" dependencies = [ "bitflags", "cexpr", "clang-sys", - "clap 3.2.22", - "env_logger 0.9.1", "lazy_static", "lazycell", "log", @@ -433,6 +431,7 @@ dependencies = [ "regex", "rustc-hash", "shlex", + "syn 1.0.102", "which", ] @@ -549,13 +548,10 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "c1db59621ec70f09c5e9b597b220c7a2b43611f4710dc03ceb8748637775692c" [[package]] -name = "castaway" -version = "0.2.2" +name = "camino" +version = "1.1.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8a17ed5635fc8536268e5d4de1e22e81ac34419e5f052d4d51f4e01dcc263fcc" -dependencies = [ - "rustversion", -] +checksum = "c59e92b5a388f549b863a7bea62612c09f24c8393560709a54558a9abdfb3b9c" [[package]] name = "cbindgen" @@ -778,19 +774,6 @@ dependencies = [ "memchr", ] -[[package]] -name = "compact_str" -version = "0.7.1" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f86b9c4c00838774a6d902ef931eff7470720c51d90c2e32cfe15dc304737b3f" -dependencies = [ - "castaway", - "cfg-if", - "itoa", - "ryu", - "static_assertions", -] - [[package]] name = "concolor" version = "0.0.11" @@ -938,12 +921,6 @@ dependencies = [ "cfg-if", ] -[[package]] -name = "crunchy" -version = "0.2.2" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7a81dae078cea95a014a339291cec439d2f232ebe854a9d672b796c6afafa9b7" - [[package]] name = "crypto-common" version = "0.1.6" @@ -1303,19 +1280,6 @@ dependencies = [ "syn 2.0.38", ] -[[package]] -name = "env_logger" -version = "0.9.1" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c90bf5f19754d10198ccb95b70664fc925bd1fc090a0fd9a6ebc54acc8cd6272" -dependencies = [ - "atty", - "humantime", - "log", - "regex", - "termcolor", -] - [[package]] name = "env_logger" version = "0.10.0" @@ -1662,16 +1626,6 @@ dependencies = [ "tracing", ] -[[package]] -name = "half" -version = "2.3.1" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "bc52e53916c08643f1b56ec082790d1e86a32e58dc5268f897f313fbae7b4872" -dependencies = [ - "cfg-if", - "crunchy", -] - [[package]] name = "hashbrown" version = "0.12.3" @@ -1828,12 +1782,6 @@ dependencies = [ "libm", ] -[[package]] -name = "humantime" -version = "2.1.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9a3a5bfb195931eeb336b2a7b4d761daec841b97f947d34394601737a7bba5e4" - [[package]] name = "hyper" version = "0.14.23" @@ -2522,6 +2470,30 @@ version = "1.18.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "dd8b5dd2ae5ed71462c540258bedcb51965123ad7e7ccf4b9a8cafaa4a63576d" +[[package]] +name = "onnxruntime" +version = "0.1.0" +source = "git+https://github.com/VOICEVOX/onnxruntime-rs.git?rev=ebb9dcb9b26ee681889b52b6db3b4f642b04a250#ebb9dcb9b26ee681889b52b6db3b4f642b04a250" +dependencies = [ + "lazy_static", + "ndarray", + "onnxruntime-sys", + "thiserror", + "tracing", +] + +[[package]] +name = "onnxruntime-sys" +version = "0.0.25" +source = "git+https://github.com/VOICEVOX/onnxruntime-rs.git?rev=ebb9dcb9b26ee681889b52b6db3b4f642b04a250#ebb9dcb9b26ee681889b52b6db3b4f642b04a250" +dependencies = [ + "flate2", + "once_cell", + "tar", + "ureq", + "zip", +] + [[package]] name = "opaque-debug" version = "0.3.0" @@ -2531,8 +2503,9 @@ checksum = "624a8340c38c1b80fd549087862da4ba43e08858af025b236e509b6649fc13d5" [[package]] name = "open_jtalk" version = "0.1.25" -source = "git+https://github.com/VOICEVOX/open_jtalk-rs.git?rev=a16714ce16dec76fd0e3041a7acfa484921db3b5#a16714ce16dec76fd0e3041a7acfa484921db3b5" +source = "git+https://github.com/VOICEVOX/open_jtalk-rs.git?rev=70c76bb54522830e92803038191bf533ba68ce85#70c76bb54522830e92803038191bf533ba68ce85" dependencies = [ + "camino", "open_jtalk-sys", "thiserror", ] @@ -2540,7 +2513,7 @@ dependencies = [ [[package]] name = "open_jtalk-sys" version = "0.16.111" -source = "git+https://github.com/VOICEVOX/open_jtalk-rs.git?rev=a16714ce16dec76fd0e3041a7acfa484921db3b5#a16714ce16dec76fd0e3041a7acfa484921db3b5" +source = "git+https://github.com/VOICEVOX/open_jtalk-rs.git?rev=70c76bb54522830e92803038191bf533ba68ce85#70c76bb54522830e92803038191bf533ba68ce85" dependencies = [ "bindgen", "cmake", @@ -4288,6 +4261,7 @@ checksum = "b97acb4c28a254fd7a4aeec976c46a7fa404eac4d7c134b30c75144846d7cb8f" dependencies = [ "base64 0.13.0", "chunked_transfer", + "flate2", "log", "once_cell", "rustls", @@ -4352,36 +4326,13 @@ version = "0.9.4" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "49874b5167b65d7193b8aba1567f5c7d93d001cafc34600cee003eda787e483f" -[[package]] -name = "voicevox-ort" -version = "2.0.0-rc.0" -source = "git+https://github.com/qryxip/ort.git?rev=37af007322f0dd5a21e536ab3bcf727970f1283a#37af007322f0dd5a21e536ab3bcf727970f1283a" -dependencies = [ - "compact_str", - "half", - "ndarray", - "thiserror", - "tracing", - "voicevox-ort-sys", -] - -[[package]] -name = "voicevox-ort-sys" -version = "2.0.0-rc.0" -source = "git+https://github.com/qryxip/ort.git?rev=37af007322f0dd5a21e536ab3bcf727970f1283a#37af007322f0dd5a21e536ab3bcf727970f1283a" -dependencies = [ - "flate2", - "sha2 0.10.6", - "tar", - "ureq", -] - [[package]] name = "voicevox_core" version = "0.0.0" dependencies = [ "anyhow", "async_zip", + "camino", "derive-getters", "derive-new", "derive_more", @@ -4398,6 +4349,7 @@ dependencies = [ "nanoid", "ndarray", "once_cell", + "onnxruntime", "open_jtalk", "ouroboros", "pretty_assertions", @@ -4412,7 +4364,6 @@ dependencies = [ "tokio", "tracing", "uuid", - "voicevox-ort", "voicevox_core_macros", "windows", "zip", @@ -4426,6 +4377,7 @@ dependencies = [ "anstyle-query", "anyhow", "assert_cmd", + "camino", "chrono", "clap 4.0.10", "colorchoice", @@ -4489,6 +4441,7 @@ dependencies = [ name = "voicevox_core_python_api" version = "0.0.0" dependencies = [ + "camino", "easy-ext", "log", "pyo3", diff --git a/Cargo.toml b/Cargo.toml index b63840d26..e4e315514 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -12,6 +12,7 @@ async-std = "1.12.0" async_zip = "0.0.11" binstall-tar = "0.4.39" bytes = "1.1.0" +camino = "1.1.6" cbindgen = "0.24.3" chrono = { version = "0.4.26", default-features = false } clap = "4.0.10" @@ -87,7 +88,7 @@ rev = "37af007322f0dd5a21e536ab3bcf727970f1283a" [workspace.dependencies.open_jtalk] git = "https://github.com/VOICEVOX/open_jtalk-rs.git" -rev = "a16714ce16dec76fd0e3041a7acfa484921db3b5" +rev = "70c76bb54522830e92803038191bf533ba68ce85" # FIXME: iOS対応のpull request(https://github.com/wesleywiser/process_path/pull/16)がマージされる見込みが無いため [workspace.dependencies.process_path] diff --git a/crates/voicevox_core/Cargo.toml b/crates/voicevox_core/Cargo.toml index 06fd2f6a7..fab7e4956 100644 --- a/crates/voicevox_core/Cargo.toml +++ b/crates/voicevox_core/Cargo.toml @@ -12,6 +12,7 @@ directml = ["voicevox-ort/directml"] [dependencies] anyhow.workspace = true async_zip = { workspace = true, features = ["full"] } +camino.workspace = true derive-getters.workspace = true derive-new.workspace = true derive_more.workspace = true diff --git a/crates/voicevox_core/src/__internal/doctest_fixtures.rs b/crates/voicevox_core/src/__internal/doctest_fixtures.rs index a27478d98..426f6cd09 100644 --- a/crates/voicevox_core/src/__internal/doctest_fixtures.rs +++ b/crates/voicevox_core/src/__internal/doctest_fixtures.rs @@ -1,9 +1,9 @@ -use std::path::Path; +use camino::Utf8Path; use crate::{AccelerationMode, InitializeOptions}; pub async fn synthesizer_with_sample_voice_model( - open_jtalk_dic_dir: impl AsRef, + open_jtalk_dic_dir: impl AsRef, ) -> anyhow::Result> { let syntesizer = crate::tokio::Synthesizer::new( crate::tokio::OpenJtalk::new(open_jtalk_dic_dir).await?, diff --git a/crates/voicevox_core/src/engine/open_jtalk.rs b/crates/voicevox_core/src/engine/open_jtalk.rs index 6eee85708..7c272cb74 100644 --- a/crates/voicevox_core/src/engine/open_jtalk.rs +++ b/crates/voicevox_core/src/engine/open_jtalk.rs @@ -15,11 +15,11 @@ pub trait FullcontextExtractor: Clone + Send + Sync + 'static { pub(crate) mod blocking { use std::{ io::Write as _, - path::Path, sync::{Arc, Mutex}, }; - use anyhow::anyhow; + use anyhow::Context as _; + use camino::{Utf8Path, Utf8PathBuf}; use open_jtalk::{mecab_dict_index, text2mecab, JpCommon, ManagedResource, Mecab, Njd}; use tempfile::NamedTempFile; @@ -32,12 +32,8 @@ pub(crate) mod blocking { pub struct OpenJtalk(pub(super) Arc); impl self::OpenJtalk { - pub fn new(open_jtalk_dict_dir: impl AsRef) -> crate::result::Result { - let dict_dir = open_jtalk_dict_dir - .as_ref() - .to_str() - .unwrap_or_else(|| todo!()) // FIXME: `camino::Utf8Path`を要求するようにする - .to_owned(); + pub fn new(open_jtalk_dict_dir: impl AsRef) -> crate::result::Result { + let dict_dir = open_jtalk_dict_dir.as_ref().to_owned(); // FIXME: この`{}`はGitのdiffを抑えるためだけに存在 { @@ -47,11 +43,12 @@ pub(crate) mod blocking { jpcommon: ManagedResource::initialize(), }; - let result = resources.mecab.load(&*dict_dir); - if !result { - // FIXME: 「システム辞書を読もうとしたけど読めなかった」というエラーをちゃんと用意する - return Err(ErrorRepr::NotLoadedOpenjtalkDict.into()); - } + // FIXME: 「システム辞書を読もうとしたけど読めなかった」というエラーをちゃんと用意する + resources + .mecab + .load(&*dict_dir) + .inspect_err(|e| tracing::error!("{e:?}")) + .map_err(|_| ErrorRepr::NotLoadedOpenjtalkDict)?; Ok(Self(Arc::new(Inner { resources: Mutex::new(resources), @@ -124,7 +121,7 @@ pub(crate) mod blocking { pub(super) struct Inner { resources: std::sync::Mutex, - dict_dir: String, // FIXME: `camino::Utf8PathBuf`にする + dict_dir: Utf8PathBuf, } impl Inner { @@ -145,34 +142,37 @@ pub(crate) mod blocking { NamedTempFile::new().map_err(|e| ErrorRepr::UseUserDict(e.into()))?; let temp_dict_path = temp_dict.into_temp_path(); + // FIXME: `.unwrap()`ではなく、エラーとして回収する + let temp_csv_path = Utf8Path::from_path(temp_csv_path.as_ref()).unwrap(); + let temp_dict_path = Utf8Path::from_path(temp_dict_path.as_ref()).unwrap(); + // Mecabでユーザー辞書をコンパイル // TODO: エラー(SEGV)が出るパターンを把握し、それをRust側で防ぐ。 mecab_dict_index(&[ "mecab-dict-index", "-d", - &self.dict_dir, + self.dict_dir.as_ref(), "-u", - temp_dict_path.to_str().unwrap(), + temp_dict_path.as_ref(), "-f", "utf-8", "-t", "utf-8", - temp_csv_path.to_str().unwrap(), + temp_csv_path.as_ref(), "-q", ]); - self.load_with_userdic(Some(temp_dict_path.as_ref())) + self.load_with_userdic(Some(temp_dict_path)) } } - fn load_with_userdic(&self, dict_path: Option<&Path>) -> crate::result::Result<()> { + fn load_with_userdic(&self, dict_path: Option<&Utf8Path>) -> crate::result::Result<()> { let Resources { mecab, .. } = &mut *self.resources.lock().unwrap(); - let result = mecab.load_with_userdic(self.dict_dir.as_ref(), dict_path); - - if !result { - return Err(ErrorRepr::UseUserDict(anyhow!("辞書を読み込めませんでした。")).into()); - } - Ok(()) + mecab + .load_with_userdic(self.dict_dir.as_ref(), dict_path) + .context("辞書を読み込めませんでした。") + .map_err(ErrorRepr::UseUserDict) + .map_err(Into::into) } } @@ -188,7 +188,7 @@ pub(crate) mod blocking { } pub(crate) mod tokio { - use std::path::Path; + use camino::Utf8Path; use super::FullcontextExtractor; @@ -197,7 +197,7 @@ pub(crate) mod tokio { pub struct OpenJtalk(super::blocking::OpenJtalk); impl self::OpenJtalk { - pub async fn new(open_jtalk_dict_dir: impl AsRef) -> crate::result::Result { + pub async fn new(open_jtalk_dict_dir: impl AsRef) -> crate::result::Result { let open_jtalk_dict_dir = open_jtalk_dict_dir.as_ref().to_owned(); let blocking = crate::task::asyncify(|| super::blocking::OpenJtalk::new(open_jtalk_dict_dir)) diff --git a/crates/voicevox_core_c_api/Cargo.toml b/crates/voicevox_core_c_api/Cargo.toml index 35a2b254e..62852bdb0 100644 --- a/crates/voicevox_core_c_api/Cargo.toml +++ b/crates/voicevox_core_c_api/Cargo.toml @@ -19,6 +19,7 @@ directml = ["voicevox_core/directml"] [dependencies] anstream = { workspace = true, default-features = false, features = ["auto"] } anstyle-query.workspace = true +camino.workspace = true chrono = { workspace = true, default-features = false, features = ["clock"] } colorchoice.workspace = true cstr.workspace = true diff --git a/crates/voicevox_core_c_api/src/c_impls.rs b/crates/voicevox_core_c_api/src/c_impls.rs index 0b57db3e5..4e73bf0fb 100644 --- a/crates/voicevox_core_c_api/src/c_impls.rs +++ b/crates/voicevox_core_c_api/src/c_impls.rs @@ -1,11 +1,12 @@ use std::{ffi::CString, path::Path}; +use camino::Utf8Path; use voicevox_core::{InitializeOptions, Result, VoiceModelId}; use crate::{helpers::CApiResult, OpenJtalkRc, VoicevoxSynthesizer, VoicevoxVoiceModel}; impl OpenJtalkRc { - pub(crate) fn new(open_jtalk_dic_dir: impl AsRef) -> Result { + pub(crate) fn new(open_jtalk_dic_dir: impl AsRef) -> Result { Ok(Self { open_jtalk: voicevox_core::blocking::OpenJtalk::new(open_jtalk_dic_dir)?, }) diff --git a/crates/voicevox_core_python_api/Cargo.toml b/crates/voicevox_core_python_api/Cargo.toml index d5ca43a48..5ccd1dc41 100644 --- a/crates/voicevox_core_python_api/Cargo.toml +++ b/crates/voicevox_core_python_api/Cargo.toml @@ -12,6 +12,7 @@ cuda = ["voicevox_core/cuda"] directml = ["voicevox_core/directml"] [dependencies] +camino.workspace = true easy-ext.workspace = true log.workspace = true pyo3 = { workspace = true, features = ["abi3-py38", "extension-module"] } diff --git a/crates/voicevox_core_python_api/src/convert.rs b/crates/voicevox_core_python_api/src/convert.rs index 4b908c48b..6544ce26c 100644 --- a/crates/voicevox_core_python_api/src/convert.rs +++ b/crates/voicevox_core_python_api/src/convert.rs @@ -1,5 +1,6 @@ use std::{error::Error as _, future::Future, iter, path::PathBuf}; +use camino::Utf8PathBuf; use easy_ext::ext; use pyo3::{ exceptions::{PyException, PyValueError}, @@ -38,10 +39,12 @@ pub fn from_acceleration_mode(ob: &PyAny) -> PyResult { } } -pub fn from_utf8_path(ob: &PyAny) -> PyResult { +// FIXME: `VoiceModel`や`UserDict`についてはこれではなく、`PathBuf::extract`を直接使うようにする +pub fn from_utf8_path(ob: &PyAny) -> PyResult { PathBuf::extract(ob)? .into_os_string() .into_string() + .map(Utf8PathBuf::from) .map_err(|s| PyValueError::new_err(format!("{s:?} cannot be encoded to UTF-8"))) } diff --git a/crates/voicevox_core_python_api/src/lib.rs b/crates/voicevox_core_python_api/src/lib.rs index 9d36cafcb..4cde8d711 100644 --- a/crates/voicevox_core_python_api/src/lib.rs +++ b/crates/voicevox_core_python_api/src/lib.rs @@ -6,6 +6,7 @@ use self::convert::{ to_py_user_dict_word, to_py_uuid, to_pydantic_dataclass, to_pydantic_voice_model_meta, to_rust_user_dict_word, to_rust_uuid, VoicevoxCoreResultExt as _, }; +use camino::Utf8PathBuf; use easy_ext::ext; use log::debug; use pyo3::{ @@ -115,7 +116,7 @@ impl VoiceModel { #[staticmethod] fn from_path( py: Python<'_>, - #[pyo3(from_py_with = "from_utf8_path")] path: String, + #[pyo3(from_py_with = "from_utf8_path")] path: Utf8PathBuf, ) -> PyResult<&PyAny> { pyo3_asyncio::tokio::future_into_py(py, async move { let model = voicevox_core::tokio::VoiceModel::from_path(path).await; @@ -146,7 +147,7 @@ impl OpenJtalk { #[allow(clippy::new_ret_no_self)] #[staticmethod] fn new( - #[pyo3(from_py_with = "from_utf8_path")] open_jtalk_dict_dir: String, + #[pyo3(from_py_with = "from_utf8_path")] open_jtalk_dict_dir: Utf8PathBuf, py: Python<'_>, ) -> PyResult<&PyAny> { pyo3_asyncio::tokio::future_into_py(py, async move { @@ -637,6 +638,7 @@ impl UserDict { mod blocking { use std::sync::Arc; + use camino::Utf8PathBuf; use pyo3::{ pyclass, pymethods, types::{IntoPyDict as _, PyBytes, PyDict, PyList}, @@ -661,7 +663,7 @@ mod blocking { #[staticmethod] fn from_path( py: Python<'_>, - #[pyo3(from_py_with = "crate::convert::from_utf8_path")] path: String, + #[pyo3(from_py_with = "crate::convert::from_utf8_path")] path: Utf8PathBuf, ) -> PyResult { let model = voicevox_core::blocking::VoiceModel::from_path(path).into_py_result(py)?; Ok(Self { model }) @@ -688,7 +690,7 @@ mod blocking { impl OpenJtalk { #[new] fn new( - #[pyo3(from_py_with = "super::from_utf8_path")] open_jtalk_dict_dir: String, + #[pyo3(from_py_with = "super::from_utf8_path")] open_jtalk_dict_dir: Utf8PathBuf, py: Python<'_>, ) -> PyResult { let open_jtalk =